tools/lexer_generator/rule_parser.py - Issue 59603003: Experimental parser: parsing regex subexpressions

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: tools/lexer_generator/rule_parser.py

Issue 59603003: Experimental parser: parsing regex subexpressions (Closed) Base URL: https://v8.googlecode.com/svn/branches/experimental/parser

Patch Set: Created 7 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/lexer_generator/rule_parser.py

diff --git a/tools/lexer_generator/rule_parser.py b/tools/lexer_generator/rule_parser.py

index 46cce1378c01a6710728f89f464f02cec7857a70..61e259a70a5cac2d759a0bd75360f20091c48645 100644

--- a/tools/lexer_generator/rule_parser.py

+++ b/tools/lexer_generator/rule_parser.py

@@ -27,13 +27,17 @@

import ply.yacc as yacc

from rule_lexer import RuleLexer

+from regex_parser import RegexParser

class RuleParser:

tokens = RuleLexer.tokens

def __init__(self):

- self.aliases = {}

+ self.aliases = {

+ 'eof' : "eof rule",

+ 'any' : "any rule",

+ }

self.current_transition = None

self.rules = {}

@@ -80,28 +84,48 @@ class RuleParser:

p[0] = self.current_transition

def p_composite_regex(self, p):

- '''composite_regex : regex_part OR regex_part maybe_regex_parts

- | regex_part maybe_regex_parts'''

+ '''composite_regex : regex_parts OR regex_parts

+ | regex_parts'''

if p[len(p)-1]:

p[0] = p[1:]

else:

p[0] = p[1:-1]

- def p_maybe_regex_part(self, p):

- '''maybe_regex_parts : composite_regex

- | empty'''

- p[0] = p[1]

+ def p_regex_parts(self, p):

+ '''regex_parts : regex_part

+ | regex_part regex_parts'''

+ p[0] = p[1:]

def p_regex_part(self, p):

'''regex_part : LEFT_PARENTHESIS composite_regex RIGHT_PARENTHESIS modifier

- | STRING_REGEX modifier

- | CHARACTER_CLASS_REGEX modifier

- | IDENTIFIER modifier'''

+ | regex_string_literal modifier

+ | regex_class modifier

+ | regex modifier

+ | regex_alias modifier'''

if p[len(p)-1]:

p[0] = p[1:]

else:

p[0] = p[1:-1]

+ def p_regex_string_literal(self, p):

+ 'regex_string_literal : STRING'

+ string = p[1][1:-1]

+ for c in "\+?|*[]()":

+ string = string.replace(c, "\\" + c)

+ p[0] = RegexParser.parse(string)

+ def p_regex(self, p):

+ 'regex : REGEX'

+ p[0] = RegexParser.parse(p[1][1:-1])

+ def p_regex_class(self, p):

+ 'regex_class : CHARACTER_CLASS_REGEX'

+ p[0] = RegexParser.parse(p[1])

+ def p_regex_alias(self, p):

+ 'regex_alias : IDENTIFIER'

+ p[0] = self.aliases[p[1]]

def p_modifier(self, p):

'''modifier : PLUS

| QUESTION_MARK

« no previous file with comments | « tools/lexer_generator/rule_lexer.py ('k') | no next file » | no next file with comments »