-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathGrammarGrep.py
56 lines (50 loc) · 2.37 KB
/
GrammarGrep.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
import ast
import RegExParser
class GrammarGrep:
    """Search and rewrite Python source with grammar-aware regular expressions.

    ``load_code`` parses the source with :mod:`ast` and records, for every
    interesting node, where it starts, where it ends and which grammar
    categories it belongs to.  ``match`` and ``replace`` hand the source lines
    and that label table to the NFA built by ``RegExParser.regex_to_nfa``.

    Attributes:
        code: The loaded source split into lines, or ``None`` if nothing has
            been loaded yet.
        labels: Mapping ``(line, col) -> [(label, end_line, end_col), ...]``
            with 0-based line numbers, or ``None`` if nothing has been loaded.
    """

    def __init__(self, code: str = None):
        """Create a grepper, optionally loading ``code`` immediately.

        Args:
            code: Python source text to load.  When omitted, call
                ``load_code`` before ``match`` or ``replace``.
        """
        self.code = None
        self.labels = None
        if code is not None:
            self.load_code(code)

    def match(self, regex):
        """Run ``regex`` over the loaded code and return the NFA's matches.

        Matching is greedy: it does not report every possible match, but the
        longest one from each initial position.

        Args:
            regex: Pattern passed unchanged to ``RegExParser.regex_to_nfa``.

        Returns:
            Whatever ``match_all`` of the generated NFA returns.
        """
        nfa = RegExParser.regex_to_nfa(regex)
        return nfa.match_all(self.code, self.labels)

    def replace(self, regex, replace_list):
        """Run ``regex`` over the loaded code and apply ``replace_list``.

        Args:
            regex: Pattern passed unchanged to ``RegExParser.regex_to_nfa``.
            replace_list: Replacement description forwarded unchanged to the
                NFA's ``replace_all``.

        Returns:
            Whatever ``replace_all`` of the generated NFA returns.
        """
        nfa = RegExParser.regex_to_nfa(regex)
        return nfa.replace_all(self.code, self.labels, replace_list)

    def load_code(self, code: str):
        """Parse ``code`` and rebuild ``self.code`` and ``self.labels``.

        Each AST node may receive several labels, recorded in this order:
        ``expr_type``, ``stmt_type``, ``id_type``, ``num_type``, ``str_type``.

        Args:
            code: Python source text.

        Raises:
            SyntaxError: If ``code`` is not valid Python.  The previously
                loaded code and labels are left untouched in that case.
        """
        labels = {}

        def label_names(node):
            """Return the grammar labels that apply to ``node``, in order."""
            names = []
            if isinstance(node, ast.expr):
                names.append("expr_type")
            if isinstance(node, ast.stmt):
                names.append("stmt_type")
            if isinstance(node, ast.Name):
                names.append("id_type")
            # ast.Num / ast.Str were deprecated in 3.8 and removed in 3.12;
            # literals are ast.Constant nodes distinguished by value type.
            if isinstance(node, ast.Constant):
                value = node.value
                # bool is a subclass of int but True/False are not numbers
                # here (the old ast.Num check excluded them as well).
                if isinstance(value, (int, float, complex)) and not isinstance(
                    value, bool
                ):
                    names.append("num_type")
                elif isinstance(value, str):
                    names.append("str_type")
            return names

        class LabelVisitor(ast.NodeVisitor):
            """Record start/end positions for every labelled node."""

            def generic_visit(self, node: ast.AST):
                names = label_names(node)
                if names:
                    # NOTE(review): ast column offsets are UTF-8 byte offsets;
                    # they equal character indexes only for ASCII lines.
                    # Confirm how the NFA indexes into the lines.
                    start = (node.lineno - 1, node.col_offset)
                    end_line = node.end_lineno - 1
                    end_col = node.end_col_offset
                    bucket = labels.setdefault(start, [])
                    for name in names:
                        bucket.append((name, end_line, end_col))
                # Keep walking so nested nodes are labelled too.
                super().generic_visit(node)

        parsed_code = ast.parse(code)
        LabelVisitor().visit(parsed_code)
        # Publish both attributes together, only after everything succeeded,
        # so the lines and the label table can never get out of sync.
        self.code = code.splitlines()
        self.labels = labels