|
1 | 1 | import parsion |
2 | 2 | import re |
3 | 3 |
|
| 4 | + |
class ExprLang(parsion.Parsion):
    """Small arithmetic expression language that is evaluated while parsing.

    ``LEXER_RULES`` is a list of ``(token_name, regex, handler)`` tuples; the
    first capture group of each regex is the token text that is handed to
    ``handler``.  ``GRAMMAR_RULES`` is a list of
    ``(handler_name, produced_symbol, pattern)`` tuples; a rule with a handler
    name is reduced by calling the method of the same name on this class.

    NOTE(review): symbols prefixed with ``_`` in a grammar pattern (e.g.
    ``_+``) appear to be matched but not passed to the handler, and rules
    whose handler is ``None`` appear to pass their single value through --
    confirm against the parsion documentation.
    """

    SELF_CHECK = True

    LEXER_RULES = [
        # Whitespace carries no token name.
        (None, r'(\s+)', lambda x: None),

        # Double-quoted string; the handler strips the quotes and resolves
        # backslash escapes to the escaped character itself.
        ('STR', r'("(?:[^"\\]|\\.)*")',
         lambda x: re.sub(r'\\(.)', r'\1', x[1:-1])),
        ('FLOAT', r'([0-9]+\.[0-9]*)', lambda x: float(x)),
        # The hex alternative must come first: regex alternation is ordered,
        # so with the decimal branch first "0x1F" would lex as INT "0"
        # followed by NAME "x1F".  The base is chosen explicitly because
        # int(x, base=0) raises ValueError for decimals with leading zeros
        # such as "012", which would make lexing itself fail.
        ('INT', r'(0x[0-9a-fA-F]+|[0-9]+)',
         lambda x: int(x, 16) if x.startswith('0x') else int(x)),

        # Keywords must not be followed by an identifier character.  The
        # boundary class mirrors the characters accepted by NAME (including
        # upper case) so that e.g. "forX" lexes as one NAME, not FOR + NAME.
        ('FOR', r'(for)(?:[^a-zA-Z0-9_]|$)', lambda x: None),
        ('IN', r'(in)(?:[^a-zA-Z0-9_]|$)', lambda x: None),
        ('IF', r'(if)(?:[^a-zA-Z0-9_]|$)', lambda x: None),
        ('THEN', r'(then)(?:[^a-zA-Z0-9_]|$)', lambda x: None),
        ('ELSE', r'(else)(?:[^a-zA-Z0-9_]|$)', lambda x: None),

        ('NAME', r'([a-zA-Z0-9_]+)', lambda x: x),

        # '==' is listed before '=' so the two-character operator wins.
        ('==', r'(==)', lambda x: None),

        ('-', r'(-)', lambda x: None),
        ('+', r'(\+)', lambda x: None),
        ('*', r'(\*)', lambda x: None),
        ('/', r'(\/)', lambda x: None),

        (',', r'(,)', lambda x: None),
        ('.', r'(\.)', lambda x: None),
        ('=', r'(=)', lambda x: None),
        ('(', r'([\(])', lambda x: None),
        (')', r'([\)])', lambda x: None),
        ('[', r'(\[)', lambda x: None),
        (']', r'(\])', lambda x: None),

        # Intended to not fail during lexing phase, but push invalid inputs
        # to parsing phase, with more useful error messages
        ('CHAR', r'(.)', lambda x: x)
    ]

    GRAMMAR_RULES = [
        ('entry', 'entry', 'expr'),

        ('expr_eq', 'expr', 'expr1 _== expr1'),

        (None, 'expr', 'expr1'),

        ('expr_add', 'expr1', 'expr1 _+ expr2'),
        ('expr_sub', 'expr1', 'expr1 _- expr2'),

        (None, 'expr1', 'expr2'),

        ('expr_mult', 'expr2', 'expr2 _* expr3'),
        ('expr_div', 'expr2', 'expr2 _/ expr3'),

        (None, 'expr2', 'expr3'),

        ('expr_neg', 'expr3', '_- expr4'),

        (None, 'expr3', 'expr4'),

        ('expr_int', 'expr4', 'INT'),
        ('expr_float', 'expr4', 'FLOAT'),
        ('expr_var', 'expr4', 'NAME'),
        ('expr_str', 'expr4', 'STR'),

        (None, 'expr4', '_( expr _)'),
    ]

    def expr_eq(self, lhs, rhs):
        """Return whether the two operands compare equal."""
        return lhs == rhs

    def expr_add(self, lhs, rhs):
        """Return ``lhs + rhs``."""
        return lhs + rhs

    def expr_sub(self, lhs, rhs):
        """Return ``lhs - rhs``."""
        return lhs - rhs

    def expr_mult(self, lhs, rhs):
        """Return ``lhs * rhs``."""
        return lhs * rhs

    def expr_div(self, lhs, rhs):
        """Return ``lhs // rhs``.

        This is floor division, so the quotient is rounded down even when an
        operand is a float.
        """
        return lhs // rhs

    def expr_neg(self, v):
        """Return the arithmetic negation of ``v``."""
        return -v

    def expr_int(self, v):
        """Return the integer literal value unchanged."""
        return v

    def expr_float(self, v):
        """Return the float literal value unchanged."""
        return v

    def expr_var(self, v):
        """Return the NAME token text unchanged; no variable lookup is done."""
        return v

    def expr_str(self, v):
        """Return the already-unescaped string literal unchanged."""
        return v
101 | 102 |
|
102 | 103 |
|
if __name__ == '__main__':
    # Build the parser from the rules declared on ExprLang.
    parser = ExprLang()

    # To inspect the generated parsing tables, uncomment the next line
    # (it relies on the "tabulate" library):
    # parser.print()

    # Evaluate a sample expression and show the result.
    sample_expression = '(12 + 32 * 4) / 7 + 13'
    result = parser.parse(sample_expression)
    print(result)
0 commit comments