bindings/scripts/blink_idl_parser.py - Issue 540533002: Roll IDL to Dartium37 (r181268)

Unified Diff: bindings/scripts/blink_idl_parser.py

Issue 540533002: Roll IDL to Dartium37 (r181268) (Closed) Base URL: https://dart.googlecode.com/svn/third_party/WebCore

Patch Set: Created 6 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: bindings/scripts/blink_idl_parser.py

diff --git a/bindings/scripts/blink_idl_parser.py b/bindings/scripts/blink_idl_parser.py

new file mode 100644

index 0000000000000000000000000000000000000000..6b205f2421c0c3f18ac2d51bad1fdce7988fe697

--- /dev/null

+++ b/bindings/scripts/blink_idl_parser.py

@@ -0,0 +1,446 @@

+# Redistribution and use in source and binary forms, with or without

+# modification, are permitted provided that the following conditions are

+# met:

+# * Redistributions of source code must retain the above copyright

+# notice, this list of conditions and the following disclaimer.

+# * Redistributions in binary form must reproduce the above

+# copyright notice, this list of conditions and the following disclaimer

+# in the documentation and/or other materials provided with the

+# distribution.

+# * Neither the name of Google Inc. nor the names of its

+# contributors may be used to endorse or promote products derived from

+# this software without specific prior written permission.

+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

+# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

+# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

+# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

+# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

+# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

+# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

+# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

+# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

+# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

+"""Parser for Blink IDL.

+The parser uses the PLY (Python Lex-Yacc) library to build a set of parsing

+rules which understand the Blink dialect of Web IDL.

+It derives from a standard Web IDL parser, overriding rules where Blink IDL

+differs syntactically or semantically from the base parser, or where the base

+parser diverges from the Web IDL standard.

+Web IDL:

+ http://www.w3.org/TR/WebIDL/

+Web IDL Grammar:

+ http://www.w3.org/TR/WebIDL/#idl-grammar

+PLY:

+ http://www.dabeaz.com/ply/

+Design doc:

+http://www.chromium.org/developers/design-documents/idl-compiler#TOC-Front-end

+"""

+# Disable check for line length and Member as Function due to how grammar rules

+# are defined with PLY

+# pylint: disable=R0201

+# pylint: disable=C0301

+# Disable attribute validation, as lint can't import parent class to check

+# pylint: disable=E1101

+import os.path

+import sys

+# PLY is in Chromium src/third_party/ply

+module_path, module_name = os.path.split(__file__)

+third_party = os.path.join(module_path, os.pardir, os.pardir, os.pardir, os.pardir)

+# Insert at front to override system libraries, and after path[0] == script dir

+sys.path.insert(1, third_party)

+from ply import yacc

+# Base parser is in Chromium src/tools/idl_parser

+tools_dir = os.path.join(module_path, os.pardir, os.pardir, os.pardir, os.pardir, os.pardir, 'tools')

+sys.path.append(tools_dir)

+from idl_parser.idl_parser import IDLParser, ListFromConcat

+from idl_parser.idl_parser import ParseFile as parse_file

+from blink_idl_lexer import BlinkIDLLexer

+# Explicitly set starting symbol to rule defined only in base parser.

+# BEWARE that the starting symbol should NOT be defined in both the base parser

+# and the derived one, as otherwise which is used depends on which line number

+# is lower, which is fragile. Instead, either use one in base parser or

+# create a new symbol, so that this is unambiguous.

+# FIXME: unfortunately, this doesn't work in PLY 3.4, so need to duplicate the

+# rule below.

+STARTING_SYMBOL = 'Definitions'

+# We ignore comments (and hence don't need 'Top') but base parser preserves them

+# FIXME: Upstream: comments should be removed in base parser

+REMOVED_RULES = ['Top', # [0]

+ 'Comments', # [0.1]

+ 'CommentsRest', # [0.2]

+ ]

+# Remove rules from base class

+# FIXME: add a class method upstream: @classmethod IDLParser._RemoveRules

+for rule in REMOVED_RULES:

+ production_name = 'p_' + rule

+ delattr(IDLParser, production_name)

+class BlinkIDLParser(IDLParser):

+ # [1]

+ # FIXME: Need to duplicate rule for starting symbol here, with line number

+ # *lower* than in the base parser (idl_parser.py).

+ # This is a bug in PLY: it determines starting symbol by lowest line number.

+ # This can be overridden by the 'start' parameter, but as of PLY 3.4 this

+ # doesn't work correctly.

+ def p_Definitions(self, p):

+ """Definitions : ExtendedAttributeList Definition Definitions

+ | """

+ if len(p) > 1:

+ p[2].AddChildren(p[1])

+ p[0] = ListFromConcat(p[2], p[3])

+ # Below are grammar rules used by yacc, given by functions named p_<RULE>.

+ # * The docstring is the production rule in BNF (grammar).

+ # * The body is the yacc action (semantics).

+ #

+ # The PLY framework builds the actual low-level parser by introspecting this

+ # parser object, selecting all attributes named p_<RULE> as grammar rules.

+ # It extracts the docstrings and uses them as the production rules, building

+ # the table of a LALR parser, and uses the body of the functions as actions.

+ #

+ # Reference:

+ # http://www.dabeaz.com/ply/ply.html#ply_nn23

+ #

+ # Review of yacc:

+ # Yacc parses a token stream, internally producing a Concrete Syntax Tree

+ # (CST), where each node corresponds to a production rule in the grammar.

+ # At each node, it runs an action, which is usually "produce a node in the

+ # Abstract Syntax Tree (AST)" or "ignore this node" (for nodes in the CST

+ # that aren't included in the AST, since only needed for parsing).

+ #

+ # The rules use pseudo-variables; in PLY syntax:

+ # p[0] is the left side: assign return value to p[0] instead of returning,

+ # p[1] ... p[n] are the right side: the values can be accessed, and they

+ # can be modified.

+ # (In yacc these are $$ and $1 ... $n.)

+ #

+ # The rules can look cryptic at first, but there are a few standard

+ # transforms from the CST to AST. With these in mind, the actions should

+ # be reasonably legible.

+ #

+ # * Ignore production

+ # Discard this branch. Primarily used when one alternative is empty.

+ #

+ # Sample code:

+ # if len(p) > 1:

+ # p[0] = ...

+ # # Note no assignment if len(p) == 1

+ #

+ # * Eliminate singleton production

+ # Discard this node in the CST, pass the next level down up the tree.

+ # Used to ignore productions only necessary for parsing, but not needed

+ # in the AST.

+ #

+ # Sample code:

+ # p[0] = p[1]

+ #

+ # * Build node

+ # The key type of rule. In this parser, produces object of class IDLNode.

+ # There are several helper functions:

+ # * BuildProduction: actually builds an IDLNode, based on a production.

+ # * BuildAttribute: builds an IDLAttribute, which is a temporary

+ # object to hold a name-value pair, which is then

+ # set as a Property of the IDLNode when the IDLNode

+ # is built.

+ # * BuildNamed: Same as BuildProduction, and sets the 'NAME' property.

+ # * BuildTrue: BuildAttribute with value True, for flags.

+ # See base idl_parser.py for definitions and more examples of use.

+ #

+ # Sample code:

+ # # Build node of type NodeType, with value p[1], and children.

+ # p[0] = self.BuildProduction('NodeType', p, 1, children)

+ #

+ # # Build named node of type NodeType, with name and value p[1].

+ # # (children optional)

+ # p[0] = self.BuildNamed('NodeType', p, 1)

+ #

+ # # Make a list

+ # # Used if one node has several children.

+ # children = ListFromConcat(p[2], p[3])

+ # p[0] = self.BuildProduction('NodeType', p, 1, children)

+ #

+ # # Also used to collapse the right-associative tree

+ # # produced by parsing a list back into a single list.

+ # """Foos : Foo Foos

+ # |"""

+ # if len(p) > 1:

+ # p[0] = ListFromConcat(p[1], p[2])

+ #

+ # # Add children.

+ # # Primarily used to add attributes, produced via BuildTrue.

+ # # p_StaticAttribute

+ # """StaticAttribute : STATIC Attribute"""

+ # p[2].AddChildren(self.BuildTrue('STATIC'))

+ # p[0] = p[2]

+ #

+ # Numbering scheme for the rules is:

+ # [1] for Web IDL spec (or additions in base parser)

+ # These should all be upstreamed to the base parser.

+ # [b1] for Blink IDL changes (overrides Web IDL)

+ # [b1.1] for Blink IDL additions, auxiliary rules for [b1]

+ # Numbers are as per Candidate Recommendation 19 April 2012:

+ # http://www.w3.org/TR/2012/CR-WebIDL-20120419/

+ # [3] Override action, since we distinguish callbacks

+ # FIXME: Upstream

+ def p_CallbackOrInterface(self, p):

+ """CallbackOrInterface : CALLBACK CallbackRestOrInterface

+ | Interface"""

+ if len(p) > 2:

+ p[2].AddChildren(self.BuildTrue('CALLBACK'))

+ p[0] = p[2]

+ else:

+ p[0] = p[1]

+ # [b27] Add strings, more 'Literal' productions

+ # 'Literal's needed because integers and strings are both internally strings

+ def p_ConstValue(self, p):

+ """ConstValue : BooleanLiteral

+ | FloatLiteral

+ | IntegerLiteral

+ | StringLiteral

+ | null"""

+ # Standard is (no 'string', fewer 'Literal's):

+ # ConstValue : BooleanLiteral

+ # | FloatLiteral

+ # | integer

+ # | NULL

+ p[0] = p[1]

+ # [b27.1]

+ def p_IntegerLiteral(self, p):

+ """IntegerLiteral : integer"""

+ p[0] = ListFromConcat(self.BuildAttribute('TYPE', 'integer'),

+ self.BuildAttribute('NAME', p[1]))

+ # [b27.2]

+ def p_StringLiteral(self, p):

+ """StringLiteral : string"""

+ p[0] = ListFromConcat(self.BuildAttribute('TYPE', 'DOMString'),

+ self.BuildAttribute('NAME', p[1]))

+ # [b47]

+ def p_ExceptionMember(self, p):

+ """ExceptionMember : Const

+ | ExceptionField

+ | Attribute

+ | ExceptionOperation"""

+ # Standard is (no Attribute, no ExceptionOperation):

+ # ExceptionMember : Const

+ # | ExceptionField

+ # FIXME: In DOMException.idl, Attributes should be changed to

+ # ExceptionFields, and Attribute removed from this rule.

+ p[0] = p[1]

+ # [b47.1]

+ def p_ExceptionOperation(self, p):

+ """ExceptionOperation : Type identifier '(' ')' ';'"""

+ # Needed to handle one case in DOMException.idl:

+ # // Override in a Mozilla compatible format

+ # [NotEnumerable] DOMString toString();

+ # Limited form of Operation to prevent others from being added.

+ # FIXME: Should be a stringifier instead.

+ p[0] = self.BuildNamed('ExceptionOperation', p, 2, p[1])

+ # Extended attributes

+ # [b49] Override base parser: remove comment field, since comments stripped

+ # FIXME: Upstream

+ def p_ExtendedAttributeList(self, p):

+ """ExtendedAttributeList : '[' ExtendedAttribute ExtendedAttributes ']'

+ | '[' ']'

+ | """

+ if len(p) > 3:

+ items = ListFromConcat(p[2], p[3])

+ p[0] = self.BuildProduction('ExtAttributes', p, 1, items)

+ # [b50] Allow optional trailing comma

+ # Blink-only, marked as WONTFIX in Web IDL spec:

+ # https://www.w3.org/Bugs/Public/show_bug.cgi?id=22156

+ def p_ExtendedAttributes(self, p):

+ """ExtendedAttributes : ',' ExtendedAttribute ExtendedAttributes

+ | ','

+ |"""

+ if len(p) > 3:

+ p[0] = ListFromConcat(p[2], p[3])

+ # [b51] Add ExtendedAttributeIdentAndOrIdent

+ def p_ExtendedAttribute(self, p):

+ """ExtendedAttribute : ExtendedAttributeNoArgs

+ | ExtendedAttributeArgList

+ | ExtendedAttributeIdent

+ | ExtendedAttributeIdentList

+ | ExtendedAttributeStringLiteralList

+ | ExtendedAttributeNamedArgList"""

+ p[0] = p[1]

+ # [59]

+ # FIXME: Upstream UnionType

+ def p_UnionType(self, p):

+ """UnionType : '(' UnionMemberType OR UnionMemberType UnionMemberTypes ')'"""

+ members = ListFromConcat(p[2], p[4], p[5])

+ p[0] = self.BuildProduction('UnionType', p, 1, members)

+ # [60]

+ def p_UnionMemberType(self, p):

+ """UnionMemberType : NonAnyType

+ | UnionType TypeSuffix

+ | ANY '[' ']' TypeSuffix"""

+ if len(p) == 2:

+ p[0] = self.BuildProduction('Type', p, 1, p[1])

+ elif len(p) == 3:

+ p[0] = self.BuildProduction('Type', p, 1, ListFromConcat(p[1], p[2]))

+ else:

+ any_node = ListFromConcat(self.BuildProduction('Any', p, 1), p[4])

+ p[0] = self.BuildProduction('Type', p, 1, any_node)

+ # [61]

+ def p_UnionMemberTypes(self, p):

+ """UnionMemberTypes : OR UnionMemberType UnionMemberTypes

+ |"""

+ if len(p) > 2:

+ p[0] = ListFromConcat(p[2], p[3])

+ # [70] Override base parser to remove non-standard sized array

+ # FIXME: Upstream

+ def p_TypeSuffix(self, p):

+ """TypeSuffix : '[' ']' TypeSuffix

+ | '?' TypeSuffixStartingWithArray

+ |"""

+ if len(p) == 4:

+ p[0] = self.BuildProduction('Array', p, 1, p[3])

+ elif len(p) == 3:

+ p[0] = ListFromConcat(self.BuildTrue('NULLABLE'), p[2])

+ # [b76.1] Add support for compound Extended Attribute values (A&B and A|B)

+ def p_ExtendedAttributeIdentList(self, p):

+ """ExtendedAttributeIdentList : identifier '=' identifier '&' IdentAndList

+ | identifier '=' identifier '|' IdentOrList"""

+ value = self.BuildAttribute('VALUE', p[3] + p[4] + p[5])

+ p[0] = self.BuildNamed('ExtAttribute', p, 1, value)

+ # [b76.2] A&B&C

+ def p_IdentAndList(self, p):

+ """IdentAndList : identifier '&' IdentAndList

+ | identifier"""

+ if len(p) > 3:

+ p[0] = p[1] + p[2] + p[3]

+ else:

+ p[0] = p[1]

+ # [b76.3] A|B|C

+ def p_IdentOrList(self, p):

+ """IdentOrList : identifier '|' IdentOrList

+ | identifier"""

+ if len(p) > 3:

+ p[0] = p[1] + p[2] + p[3]

+ else:

+ p[0] = p[1]

+ # Blink extension: Add support for compound Extended Attribute values over string literals ("A"|"B")

+ def p_ExtendedAttributeStringLiteralList(self, p):

+ """ExtendedAttributeStringLiteralList : identifier '=' StringLiteralOrList"""

+ value = self.BuildAttribute('VALUE', p[3])

+ p[0] = self.BuildNamed('ExtAttribute', p, 1, value)

+ # Blink extension: one or more string literals. The values aren't propagated as literals,

+ # but their by their value only.

+ def p_StringLiteralOrList(self, p):

+ """StringLiteralOrList : StringLiteral '|' StringLiteralOrList

+ | StringLiteral"""

+ def unwrap_string(ls):

+ """Reach in and grab the string literal's "NAME"."""

+ return ls[1].value

+ if len(p) > 3:

+ p[0] = unwrap_string(p[1]) + p[2] + p[3]

+ else:

+ p[0] = unwrap_string(p[1])

+ def __init__(self,

+ # common parameters

+ debug=False,

+ # idl_parser parameters

+ lexer=None, verbose=False, mute_error=False,

+ # yacc parameters

+ outputdir='', optimize=True, write_tables=False,

+ picklefile=None):

+ if debug:

+ # Turn off optimization and caching, and write out tables,

+ # to help debugging

+ optimize = False

+ outputdir = None

+ picklefile = None

+ write_tables = True

+ if outputdir:

+ picklefile = picklefile or os.path.join(outputdir, 'parsetab.pickle')

+ lexer = lexer or BlinkIDLLexer(debug=debug,

+ outputdir=outputdir,

+ optimize=optimize)

+ self.lexer = lexer

+ self.tokens = lexer.KnownTokens()

+ # Using SLR (instead of LALR) generates the table faster,

+ # but produces the same output. This is ok b/c Web IDL (and Blink IDL)

+ # is an SLR grammar (as is often the case for simple LL(1) grammars).

+ #

+ # Optimized mode substantially decreases startup time (by disabling

+ # error checking), and also allows use of Python's optimized mode.

+ # See: Using Python's Optimized Mode

+ # http://www.dabeaz.com/ply/ply.html#ply_nn38

+ #

+ # |picklefile| allows simpler importing than |tabmodule| (parsetab.py),

+ # as we don't need to modify sys.path; virtually identical speed.

+ # See: CHANGES, Version 3.2

+ # http://ply.googlecode.com/svn/trunk/CHANGES

+ self.yaccobj = yacc.yacc(module=self,

+ start=STARTING_SYMBOL,

+ method='SLR',

+ debug=debug,

+ optimize=optimize,

+ write_tables=write_tables,

+ picklefile=picklefile)

+ self.parse_debug = debug

+ self.verbose = verbose

+ self.mute_error = mute_error

+ self._parse_errors = 0

+ self._parse_warnings = 0

+ self._last_error_msg = None

+ self._last_error_lineno = 0

+ self._last_error_pos = 0

+################################################################################

+def main(argv):

+ # If file itself executed, cache parse table

+ try:

+ outputdir = argv[1]

+ except IndexError as err:

+ print 'Usage: %s OUTPUT_DIR' % argv[0]

+ return 1

+ parser = BlinkIDLParser(outputdir=outputdir)

+if __name__ == '__main__':

+ sys.exit(main(sys.argv))

« no previous file with comments | « bindings/scripts/blink_idl_lexer.py ('k') | bindings/scripts/code_generator_v8.py » ('j') | no next file with comments »