Mercurial > hg > expressionparser
annotate expr.py @ 11:e17a3464a0b9
get precedence from a list position vs magic constants
| author | Jeff Hammel <jhammel@mozilla.com> |
|---|---|
| date | Fri, 03 Jun 2011 10:51:36 -0700 |
| parents | 15fb1081784f |
| children | 835efd8acb04 |
| rev | line source |
|---|---|
|
0
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
1 #!/usr/bin/env python |
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
2 |
|
2
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
3 # Implements a top-down parser/evaluator for simple boolean expressions. |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
4 # ideas taken from http://effbot.org/zone/simple-top-down-parsing.htm |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
5 # |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
6 # Rough grammar: |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
7 # expr := literal |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
8 # | '(' expr ')' |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
9 # | expr '&&' expr |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
10 # | expr '||' expr |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
11 # | expr '==' expr |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
12 # | expr '!=' expr |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
13 # literal := BOOL |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
14 # | INT |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
15 # | STRING |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
16 # | IDENT |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
17 # BOOL := true|false |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
18 # INT := [0-9]+ |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
19 # STRING := "[^"]*" |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
20 # IDENT := [A-Za-z_]\w* |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
21 |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
22 # Identifiers take their values from a mapping dictionary passed as the second |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
23 # argument. |
|
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
24 |
|
10
15fb1081784f
add ExpressionParser to the exports
Jeff Hammel <jhammel@mozilla.com>
parents:
9
diff
changeset
|
25 __all__ = ['parse', 'ParseError', 'ExpressionParser'] |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
26 import re |
|
0
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
27 |
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
28 # token classes |
|
10
15fb1081784f
add ExpressionParser to the exports
Jeff Hammel <jhammel@mozilla.com>
parents:
9
diff
changeset
|
class token(object):
    """Empty marker class; it defines no attributes or methods of its own."""
|
15fb1081784f
add ExpressionParser to the exports
Jeff Hammel <jhammel@mozilla.com>
parents:
9
diff
changeset
|
31 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class ident_token(object):
    """Token for an identifier; its value is looked up through the parser."""

    def __init__(self, value):
        # `value` is the identifier name exactly as the lexer matched it.
        self.value = value

    def nud(self, parser):
        """Return whatever `parser.value()` yields for this identifier name."""
        name = self.value
        return parser.value(name)
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
39 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class literal_token(object):
    """Token that carries a ready-made value and evaluates to it."""

    def __init__(self, value):
        # Stored as-is; subclasses convert the raw text before calling here.
        self.value = value

    def nud(self, parser):
        """Return the stored value; `parser` is not consulted."""
        stored = self.value
        return stored
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
45 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class eq_op_token(object):
    """The ``==`` operator."""

    def led(self, parser, left):
        """
        Parse the right-hand operand at this token's binding power and
        return the result of ``left == right``.
        """
        # `lbp` is not defined in this class body; it is assigned elsewhere.
        right = parser.expression(self.lbp)
        return left == right
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
50 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class neq_op_token(object):
    """The ``!=`` operator."""

    def led(self, parser, left):
        """
        Parse the right-hand operand at this token's binding power and
        return the result of ``left != right``.
        """
        # `lbp` is not defined in this class body; it is assigned elsewhere.
        right = parser.expression(self.lbp)
        return left != right
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
55 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class and_op_token(object):
    """The ``&&`` operator."""

    def led(self, parser, left):
        """
        Parse the right-hand operand, then return `left` if it is falsy and
        the right-hand value otherwise.
        """
        # The right operand is always parsed, even when `left` is falsy, so
        # that its tokens are consumed from the stream.
        rhs = parser.expression(self.lbp)
        if not left:
            return left
        return rhs
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
61 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class or_op_token(object):
    """The ``||`` operator."""

    def led(self, parser, left):
        """
        Parse the right-hand operand, then return `left` if it is truthy and
        the right-hand value otherwise.
        """
        # The right operand is always parsed, even when `left` is truthy, so
        # that its tokens are consumed from the stream.
        rhs = parser.expression(self.lbp)
        if left:
            return left
        return rhs
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
67 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class lparen_token(object):
    """The ``(`` token, which opens a parenthesized sub-expression."""

    def nud(self, parser):
        """
        Evaluate the expression that follows, require a closing
        rparen_token after it, and return the inner expression's value.
        """
        inner = parser.expression()
        # advance() raises if the current token is not an rparen_token
        parser.advance(rparen_token)
        return inner
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
74 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class rparen_token(object):
    """The ``)`` token; it defines neither nud() nor led()."""
|
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
77 |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
class end_token(object):
    """Marker for the end of the input; always ends parsing."""
|
0
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
80 |
| 8 | 81 ### derived literal tokens |
| 82 | |
|
7
325dccc38308
begin using subclasses for tokens; the eventual goal is that a token class will know everything it can about what it is and the parser just knows about what tokens are
Jeff Hammel <jhammel@mozilla.com>
parents:
4
diff
changeset
|
class bool_token(literal_token):
    """Literal token for the keywords ``true`` and ``false``."""

    def __init__(self, value):
        # Any text other than 'true' or 'false' raises KeyError here.
        as_bool = {'true': True, 'false': False}[value]
        literal_token.__init__(self, as_bool)
|
325dccc38308
begin using subclasses for tokens; the eventual goal is that a token class will know everything it can about what it is and the parser just knows about what tokens are
Jeff Hammel <jhammel@mozilla.com>
parents:
4
diff
changeset
|
87 |
class int_token(literal_token):
    """Literal token whose matched text is converted with int()."""

    def __init__(self, value):
        number = int(value)
        literal_token.__init__(self, number)
| 91 | |
class string_token(literal_token):
    """Literal token for a quoted string."""

    def __init__(self, value):
        # Drop the first and last character (the surrounding quotes).
        unquoted = value[1:-1]
        literal_token.__init__(self, unquoted)
| 95 | |
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
# Operator precedence table.  A token class's left binding power (lbp) is the
# index of the tuple it appears in, so later entries bind more tightly and
# classes sharing a tuple share the same binding power.
precedence = [(end_token, rparen_token),
              (or_op_token,),
              (and_op_token,),
              (eq_op_token, neq_op_token),
              (lparen_token,),
              ]
for index, rank in enumerate(precedence):
    # The loop variable is deliberately not called `token`: at module level
    # that name would rebind (and so clobber) the `token` class.
    for token_class in rank:
        token_class.lbp = index  # lbp = left binding power
|
4
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
105 |
|
2
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
class ParseError(Exception):
    """Raised when a conditional expression cannot be parsed."""
|
2
94a293b914af
add documentation, clean up interface slightly, tweak tests
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
1
diff
changeset
|
108 |
|
0
ae57e69e4b15
simple expression parser
Ted Mielczarek <ted.mielczarek@gmail.com>
parents:
diff
changeset
|
class ExpressionParser(object):
    """
    Top-down parser/evaluator for simple boolean expressions.

    The input is lexed into token objects.  A token that can start an
    expression provides nud(parser); a binary operator token provides
    led(parser, left).  Every token that may follow a complete operand
    carries an `lbp` (left binding power) attribute used by expression().
    """

    def __init__(self, text, valuemapping):
        """
        Initialize the parser with input |text|, and |valuemapping| as
        a dict mapping identifier names to values.
        """
        self.text = text
        self.valuemapping = valuemapping

    def _tokenize(self):
        """
        Lex the input text into tokens and yield them in sequence, followed
        by a final end_token.  Raises a ParseError if part of the input
        cannot be lexed.
        """
        # scanner callbacks
        def bool_(scanner, t): return bool_token(t)
        def identifier(scanner, t): return ident_token(t)
        def integer(scanner, t): return int_token(t)
        def eq(scanner, t): return eq_op_token()
        def neq(scanner, t): return neq_op_token()
        def or_(scanner, t): return or_op_token()
        def and_(scanner, t): return and_op_token()
        def lparen(scanner, t): return lparen_token()
        def rparen(scanner, t): return rparen_token()
        def string_(scanner, t): return string_token(t)

        scanner = re.Scanner([
            # \b stops identifiers that merely start with a keyword
            # (e.g. "trueish") from being lexed as a bool plus an identifier
            (r"true\b|false\b", bool_),
            (r"[a-zA-Z_]\w*", identifier),
            (r"[0-9]+", integer),
            (r'"[^"]*"', string_),
            (r"==", eq),
            (r"!=", neq),
            (r"\|\|", or_),
            (r"&&", and_),
            (r"\(", lparen),
            (r"\)", rparen),
            (r"\s+", None),  # skip whitespace
        ])
        tokens, remainder = scanner.scan(self.text)
        if remainder:
            # scan() stops at the first position no pattern matches; ignoring
            # the rest would silently evaluate a truncated expression
            raise ParseError("unexpected input: %s" % remainder)
        for t in tokens:
            yield t
        yield end_token()

    def value(self, ident):
        """
        Look up the value of |ident| in the value mapping passed in the
        constructor.  An unknown identifier raises whatever the mapping
        raises for a missing key.
        """
        return self.valuemapping[ident]

    def advance(self, expected):
        """
        Assert that the current token is an instance of |expected|, and
        advance to the next token.  Raises an Exception otherwise.
        """
        if not isinstance(self.token, expected):
            raise Exception("Unexpected token!")
        self.token = next(self.iter)

    def expression(self, rbp=0):
        """
        Parse and return the value of an expression.  Operators keep being
        folded into the result while the current token's left binding power
        is greater than |rbp|; parsing stops at the first token whose left
        binding power is not.
        """
        t = self.token
        self.token = next(self.iter)
        left = t.nud(self)
        while rbp < self.token.lbp:
            t = self.token
            self.token = next(self.iter)
            left = t.led(self, left)
        return left

    def parse(self):
        """
        Parse and return the value of the expression in the text
        passed to the constructor. Raises a ParseError if the expression
        could not be parsed.
        """
        try:
            self.iter = self._tokenize()
            self.token = next(self.iter)
            result = self.expression()
            # A stray ')' also stops expression(); anything but the end
            # token here means part of the input was never evaluated.
            if not isinstance(self.token, end_token):
                raise Exception("Unexpected token!")
            return result
        except Exception:
            # `except Exception` rather than a bare `except`, so that
            # KeyboardInterrupt and SystemExit are not turned into ParseError
            raise ParseError("could not parse: %s" % self.text)

    __call__ = parse
|
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
196 |
|
a42bb6dc2fa7
change parse mapping to **kwargs
Jeff Hammel <jhammel@mozilla.com>
parents:
3
diff
changeset
|
def parse(text, **values):
    """
    Evaluate the boolean expression in |text| and return its final value.
    Identifiers referenced in the expression take their values from the
    keyword arguments collected in |values|.  A ParseError is raised if
    parsing fails.
    """
    parser = ExpressionParser(text, values)
    return parser.parse()
