tools/lexer_generator/backtracking_generator.py - Issue 171713005: Experimental parser: add backtracking

Unified Diff: tools/lexer_generator/backtracking_generator.py

Issue 171713005: Experimental parser: add backtracking (Closed) Base URL: https://v8.googlecode.com/svn/branches/experimental/parser

Patch Set: Created 6 years, 10 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/lexer_generator/backtracking_generator.py

diff --git a/tools/lexer_generator/backtracking_generator.py b/tools/lexer_generator/backtracking_generator.py

new file mode 100644

index 0000000000000000000000000000000000000000..9bb6db6b31fc72813c5a918f3ebaed242fba0bca

--- /dev/null

+++ b/tools/lexer_generator/backtracking_generator.py

@@ -0,0 +1,149 @@

+# Redistribution and use in source and binary forms, with or without

+# modification, are permitted provided that the following conditions are

+# met:

+# * Redistributions of source code must retain the above copyright

+# notice, this list of conditions and the following disclaimer.

+# * Redistributions in binary form must reproduce the above

+# copyright notice, this list of conditions and the following

+# disclaimer in the documentation and/or other materials provided

+# with the distribution.

+# * Neither the name of Google Inc. nor the names of its

+# contributors may be used to endorse or promote products derived

+# from this software without specific prior written permission.

+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

+# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

+# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

+# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

+# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

+# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

+# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

+# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

+# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

+# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

+from transition_key import TransitionKey

+from automaton import Term, Action, Automaton

+from dfa import Dfa

+class BacktrackingGenerator(object):

+ @staticmethod

+ def generate(dfa, default_action):

+ return BacktrackingGenerator(dfa, default_action, None).__generate()

+ def __init__(self, dfa, default_action, log):

+ self.__dfa = dfa

+ self.__default_action = default_action

+ self.__log = log

+ def __generate(self):

+ dfa = self.__dfa

+ default_action = self.__default_action

+ terminal_set = dfa.terminal_set()

+ # Collect states that terminate currently.

+ action_states = {}

+ omega_states = set()

+ def f(state, acc):

+ omega_state = state.omega_transition()

+ if omega_state == None:

+ if not state in terminal_set:

+ state.key_iter().next() # should have at least one transition

+ return

+ assert omega_state in terminal_set

+ assert not state in terminal_set

+ assert not list(omega_state.key_iter())

+ omega_states.add(omega_state)

+ match_action = omega_state.action()

+ if not match_action:

+ match_action = default_action

+ action_states[state] = match_action

+ dfa.visit_all_states(f)

+ assert omega_states == terminal_set

+ # Find nodes that need backtracking edges

+ incoming_transitions = dfa.build_incoming_transitions_map()

+ backtracking_map = {}

+ store_states = set()

+ # Start node may be an edge case.

+ start_state = dfa.start_state()

+ if (not start_state in incoming_transitions and

+ not start_state in action_states):

+ action_states[start_state] = default_action

+ for state in incoming_transitions.iterkeys():

+ if state in omega_states or state in action_states:

+ continue

+ assert not state.omega_transition()

+ seen = set([state])

+ unchecked = set([state])

+ match_edge = set()

+ while unchecked:

+ next = set()

+ for unchecked_state in unchecked:

+ if not unchecked_state in incoming_transitions:

+ assert unchecked_state == start_state

+ match_edge.add(unchecked_state)

+ continue

+ for (incoming_key, incoming_state) in incoming_transitions[unchecked_state]:

+ assert not incoming_state in omega_states

+ assert not incoming_key == TransitionKey.omega()

+ if incoming_state in seen:

+ continue

+ if incoming_state in action_states:

+ match_edge.add(incoming_state)

+ seen.add(incoming_state)

+ else:

+ next.add(incoming_state)

+ seen |= unchecked

+ unchecked = next - seen

+ # accumulate unique actions

+ actions = set(map(lambda x : action_states[x].term(), match_edge))

+ assert actions

+ if not len(actions) == 1:

+ # TODO(dcarney): need to warn here after second pass

+ # actions = set([default_action])

+ continue

+ action = iter(actions).next()

+ # don't install default actions

+ if action == default_action.term():

+ continue

+ store_states |= match_edge

+ backtracking_map[state.node_number()] = (action, match_edge)

+ def install_backtracking_action(new_states, node_number):

+ omega_state_id = str(node_number) + '_bt'

+ key = TransitionKey.omega()

+ new_states[str(node_number)]['transitions'][key] = omega_state_id

+ # install new state

+ old_action = backtracking_map[node_number][0]

+ new_states[omega_state_id] = {

+ 'transitions' : {},

+ 'action' : Action(Term('backtrack', old_action), 0),

+ 'terminal' : True,

+ }

+ def new_state_action(old_state):

+ action = old_state.action()

+ if not old_state in store_states:

+ return action

+ term = Term('store_lexing_state')

+ if action:

+ # TODO(dcarney): split target state instead

+ term = Term('chain', term, action.term())

+ return Action(term, 0)

+ # Now generate the new dfa.

+ def convert(old_state, new_states):

+ node_number = old_state.node_number()

+ # Clone existing state.

+ new_states[str(node_number)] = {

+ 'transitions' : {

+ k : str(v.node_number()) for (k, v) in old_state.key_state_iter() },

+ 'action' : new_state_action(old_state),

+ 'terminal' : old_state in terminal_set

+ }

+ # install a backtracking action

+ if node_number in backtracking_map:

+ install_backtracking_action(new_states, node_number)

+ return new_states

+ new_states = dfa.visit_all_states(convert, {})

+ return Dfa(dfa.encoding(), str(start_state.node_number()), new_states)

« no previous file with comments | « tools/gyp/v8.gyp ('k') | tools/lexer_generator/code_generator.jinja » ('j') | no next file with comments »