tools/lexer_generator/rule_parser.py - Issue 68683007: Parser generator: more layering refactoring

Unified Diff: tools/lexer_generator/rule_parser.py

Issue 68683007: Parser generator: more layering refactoring (Closed) Base URL: https://v8.googlecode.com/svn/branches/experimental/parser

Patch Set: Created 7 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/lexer_generator/rule_parser.py

diff --git a/tools/lexer_generator/rule_parser.py b/tools/lexer_generator/rule_parser.py

index 9652ee67b15a64bdab4fb43f4a1c27e4f3894728..76bd1fe0fe132fef4d13548ec5a829abe89b2d8e 100644

--- a/tools/lexer_generator/rule_parser.py

+++ b/tools/lexer_generator/rule_parser.py

@@ -29,6 +29,7 @@ import ply.yacc as yacc

from rule_lexer import RuleLexer

from regex_parser import RegexParser

from nfa_builder import NfaBuilder

+from dfa import Dfa

from transition_keys import TransitionKey

class RuleParserState:

@@ -212,3 +213,73 @@ class RuleParser:

raise

parser.__state = None

assert parser_state.transitions <= set(parser_state.rules.keys())

class RuleProcessor(object):
    """Turn a parsed rule file into one (nfa, dfa) pair per rule set.

    The automata are stored in a dict keyed by rule-set name; the rule set
    named 'default' must exist and is the one used by `lex`.
    """

    def __init__(self, parser_state):
        """Build all automata from an already populated parser state.

        Args:
            parser_state: object exposing `rules` (dict of rule-set name to
                rule description) and `character_classes`, as read by
                `__process_parser_state`.
        """
        self.__automata = {}
        self.__process_parser_state(parser_state)

    @staticmethod
    def parse(string):
        """Parse `string` with RuleParser and return a RuleProcessor for it."""
        parser_state = RuleParserState()
        RuleParser.parse(string, parser_state)
        return RuleProcessor(parser_state)

    def automata_iter(self):
        """Return an iterator over (rule_name, (nfa, dfa)) items."""
        return iter(self.__automata.items())

    def default_automata(self):
        """Return the (nfa, dfa) pair stored under the name 'default'."""
        return self.__automata['default']

    def lex(self, string):
        """Lex `string` with the dfa of the 'default' rule set."""
        _nfa, dfa = self.default_automata()
        return dfa.lex(string)

    def __process_parser_state(self, parser_state):
        """Build a graph per rule set, then an (nfa, dfa) pair per graph.

        Fills `self.__automata` with one entry per key of
        `parser_state.rules`.
        """
        rule_map = {}
        builder = NfaBuilder()
        builder.set_character_classes(parser_state.character_classes)
        assert 'default' in parser_state.rules

        def process(k, v):
            """Combine every regex graph of rule set `k` into rule_map[k]."""
            graphs = []
            continues = 0
            for (graph, (precedence, code, transition)) in v['regex']:
                # Fall back to the rule set's default action when the rule
                # has no code of its own.
                action = code or v['default_action']
                if action:
                    graph = NfaBuilder.add_action(graph, (precedence, action))
                if not transition or transition == 'break':
                    pass
                elif transition == 'continue':
                    # 'continue' is only accepted outside the default rule set.
                    assert k != 'default'
                    continues += 1
                    graph = NfaBuilder.add_continue(graph)
                elif transition in ('terminate', 'terminate_illegal'):
                    # Terminating rules carry no code; the transition name
                    # itself is attached as the action, with precedence -1.
                    assert not code
                    graph = NfaBuilder.add_action(graph, (-1, transition))
                else:
                    # Any other transition names another rule set, which is
                    # only accepted from the default rule set. That rule
                    # set's graph must already be in rule_map.
                    assert k == 'default'
                    subgraph_modifier = '*' if code else None
                    graph = NfaBuilder.join_subgraph(
                        graph, transition, rule_map[transition],
                        subgraph_modifier)
                graphs.append(graph)
            # When every collected graph is a 'continue' (this includes the
            # case of no graphs at all), an epsilon graph is added as well.
            if continues == len(graphs):
                graphs.append(NfaBuilder.epsilon())
            if v['catch_all']:
                assert v['catch_all'] == 'continue'
                graphs.append(
                    NfaBuilder.add_continue(NfaBuilder.catch_all()))
            rule_map[k] = NfaBuilder.or_graphs(graphs)

        # Process the subgraphs first: the default graph looks them up in
        # rule_map when it joins them.
        for k, v in parser_state.rules.items():
            if k == 'default':
                continue
            process(k, v)
        process('default', parser_state.rules['default'])

        # Build the automata.
        for rule_name, graph in rule_map.items():
            nfa = builder.nfa(graph)
            (start, dfa_nodes) = nfa.compute_dfa()
            dfa = Dfa(start, dfa_nodes)
            self.__automata[rule_name] = (nfa, dfa)

« no previous file with comments | « tools/lexer_generator/lexer_test.py ('k') | no next file » | no next file with comments »