Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(310)

Unified Diff: tools/lexer_generator/rule_parser.py

Issue 68683007: Parser generator: more layering refactoring (Closed) Base URL: https://v8.googlecode.com/svn/branches/experimental/parser
Patch Set: Created 7 years, 1 month ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « tools/lexer_generator/lexer_test.py ('k') | no next file » | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: tools/lexer_generator/rule_parser.py
diff --git a/tools/lexer_generator/rule_parser.py b/tools/lexer_generator/rule_parser.py
index 9652ee67b15a64bdab4fb43f4a1c27e4f3894728..76bd1fe0fe132fef4d13548ec5a829abe89b2d8e 100644
--- a/tools/lexer_generator/rule_parser.py
+++ b/tools/lexer_generator/rule_parser.py
@@ -29,6 +29,7 @@ import ply.yacc as yacc
from rule_lexer import RuleLexer
from regex_parser import RegexParser
from nfa_builder import NfaBuilder
+from dfa import Dfa
from transition_keys import TransitionKey
class RuleParserState:
@@ -212,3 +213,73 @@ class RuleParser:
raise
parser.__state = None
assert parser_state.transitions <= set(parser_state.rules.keys())
+
+class RuleProcessor(object):
+
+ def __init__(self, parser_state):
+ self.__automata = {}
+ self.__process_parser_state(parser_state)
+
+ @staticmethod
+ def parse(string):
+ parser_state = RuleParserState()
+ RuleParser.parse(string, parser_state)
+ return RuleProcessor(parser_state)
+
+ def automata_iter(self):
+ return iter(self.__automata.items())
+
+ def default_automata(self):
+ return self.__automata['default']
+
+ def lex(self, string):
+ (nfa, dfa) = self.default_automata()
+ return dfa.lex(string)
+
+ def __process_parser_state(self, parser_state):
+ rule_map = {}
+ builder = NfaBuilder()
+ builder.set_character_classes(parser_state.character_classes)
+ assert 'default' in parser_state.rules
+ def process(k, v):
+ graphs = []
+ continues = 0
+ for (graph, (precedence, code, transition)) in v['regex']:
+ default_code = v['default_action']
+ action = code if code else default_code
+ if action:
+ graph = NfaBuilder.add_action(graph, (precedence, action))
+ if not transition or transition == 'break':
+ pass
+ elif transition == 'continue':
+ assert not k == 'default'
+ continues += 1
+ graph = NfaBuilder.add_continue(graph)
+ elif (transition == 'terminate' or
+ transition == 'terminate_illegal'):
+ assert not code
+ graph = NfaBuilder.add_action(graph, (-1, transition))
+ else:
+ assert k == 'default'
+ subgraph_modifier = '*' if code else None
+ graph = NfaBuilder.join_subgraph(
+ graph, transition, rule_map[transition], subgraph_modifier)
+ graphs.append(graph)
+ if continues == len(graphs):
+ graphs.append(NfaBuilder.epsilon())
+ if v['catch_all']:
+ assert v['catch_all'] == 'continue'
+ graphs.append(NfaBuilder.add_continue(NfaBuilder.catch_all()))
+ graph = NfaBuilder.or_graphs(graphs)
+ rule_map[k] = graph
+ # process first the subgraphs, then the default graph
+ for k, v in parser_state.rules.items():
+ if k == 'default': continue
+ process(k, v)
+ process('default', parser_state.rules['default'])
+ # build the automata
+ for rule_name, graph in rule_map.items():
+ nfa = builder.nfa(graph)
+ (start, dfa_nodes) = nfa.compute_dfa()
+ dfa = Dfa(start, dfa_nodes)
+ self.__automata[rule_name] = (nfa, dfa)
« no previous file with comments | « tools/lexer_generator/lexer_test.py ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698