-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrule_expression.py
More file actions
105 lines (88 loc) · 3.1 KB
/
rule_expression.py
File metadata and controls
105 lines (88 loc) · 3.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
import dataclasses
import re
from typing import *
token_word = re.compile(r'\$?[A-z|0-9_]+?(?=[()+\-\s])|\$?[A-z|0-9_]+?$')
token_symbol = re.compile(r'[()+\-]')
@dataclasses.dataclass
class Token:
content: str
span: Tuple[int, int]
type: Literal['operator', 'name']
level: int = 0
def to_ast(text: str) -> List[Token]:
words = (Token(x.group(), x.span(), 'name')
for x in re.finditer(token_word, text))
symbols = (Token(x.group(), x.span(), 'operator')
for x in re.finditer(token_symbol, text))
tokens = []
tokens.extend(words)
tokens.extend(symbols)
tokens.sort(key=lambda x: x.span[0])
# print(tokens)
c_level = 0
for x in tokens:
reduce_level = False
if x.type == 'operator':
if x.content == '(':
c_level += 1
reduce_level = True
elif x.content == ')':
c_level -= 1
# elif x.type == 'name':
# if x.content.startswith('$'):
# pass
if c_level < 0:
raise RuntimeError(f'bracket miss matched {x}')
x.level = c_level - 1 if reduce_level else c_level
return tokens
def operate(symbol: Literal['+', '-'], data: List[Any], value: List[Any]) -> List[Any]:
if symbol == '+':
data.extend(x for x in value if x not in data)
elif symbol == '-':
data = [x for x in data if x not in value]
else:
raise NotImplementedError()
return data
def execute(tokens: List[Token], rules: Dict[str, List[Any]]) -> List[Any]:
result = []
last_operator = None
# for i, x in enumerate(tokens):
index = 0
while True:
token = tokens[index]
value = None
if token.type == 'name':
value = rules[token.content]
if token.type == 'operator':
if token.content == '(':
next_bracket = index
while True:
next_bracket += 1
if next_bracket >= len(tokens):
raise RuntimeError(f'bracket miss matched {token}')
test_token = tokens[next_bracket]
if test_token.level == token.level and test_token.content == ')':
break
value = execute(tokens[index+1: next_bracket], rules)
index += next_bracket
elif token.content == ')':
raise RuntimeError()
else:
last_operator = token.content
if last_operator is not None and value is not None:
result = operate(last_operator, result, value)
elif value is not None:
result = value
index += 1
if index >= len(tokens):
break
return result
def debug_tokens(tokens: List[Token]) -> str:
return '\n'.join([' ' * x.level + x.content for x in tokens])
test = '((a+b-c)+$test-a1)+b_1'
ast = to_ast(test)
print(debug_tokens(ast))
rules1 = {'a': [1, 2, 3], 'a1': [4, 5, 6], 'b': [1, 3, 9], 'b_1': [2, 4, 6], 'c': [2],
'$test': [1, 2, 3, 4, 5, 6, 7, 8, 9]}
r = execute(ast, rules1)
print(r)