Index: bindings/scripts/blink_idl_parser.py |
diff --git a/bindings/scripts/blink_idl_parser.py b/bindings/scripts/blink_idl_parser.py |
new file mode 100644 |
index 0000000000000000000000000000000000000000..6b205f2421c0c3f18ac2d51bad1fdce7988fe697 |
--- /dev/null |
+++ b/bindings/scripts/blink_idl_parser.py |
@@ -0,0 +1,446 @@ |
+# Copyright (C) 2013 Google Inc. All rights reserved. |
+# |
+# Redistribution and use in source and binary forms, with or without |
+# modification, are permitted provided that the following conditions are |
+# met: |
+# |
+# * Redistributions of source code must retain the above copyright |
+# notice, this list of conditions and the following disclaimer. |
+# * Redistributions in binary form must reproduce the above |
+# copyright notice, this list of conditions and the following disclaimer |
+# in the documentation and/or other materials provided with the |
+# distribution. |
+# * Neither the name of Google Inc. nor the names of its |
+# contributors may be used to endorse or promote products derived from |
+# this software without specific prior written permission. |
+# |
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
+# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
+# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
+# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
+# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
+# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
+# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
+# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
+# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
+# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
+ |
+"""Parser for Blink IDL. |
+ |
+The parser uses the PLY (Python Lex-Yacc) library to build a set of parsing |
+rules which understand the Blink dialect of Web IDL. |
+It derives from a standard Web IDL parser, overriding rules where Blink IDL |
+differs syntactically or semantically from the base parser, or where the base |
+parser diverges from the Web IDL standard. |
+ |
+Web IDL: |
+ http://www.w3.org/TR/WebIDL/ |
+Web IDL Grammar: |
+ http://www.w3.org/TR/WebIDL/#idl-grammar |
+PLY: |
+ http://www.dabeaz.com/ply/ |
+ |
+Design doc: |
+http://www.chromium.org/developers/design-documents/idl-compiler#TOC-Front-end |
+""" |
+ |
+# Disable check for line length and Member as Function due to how grammar rules |
+# are defined with PLY |
+# |
+# pylint: disable=R0201 |
+# pylint: disable=C0301 |
+# |
+# Disable attribute validation, as lint can't import parent class to check |
+# pylint: disable=E1101 |
+ |
+import os.path |
+import sys |
+ |
+# PLY is in Chromium src/third_party/ply |
+module_path, module_name = os.path.split(__file__) |
+third_party = os.path.join(module_path, os.pardir, os.pardir, os.pardir, os.pardir) |
+# Insert at front to override system libraries, and after path[0] == script dir |
+sys.path.insert(1, third_party) |
+from ply import yacc |
+ |
+# Base parser is in Chromium src/tools/idl_parser |
+tools_dir = os.path.join(module_path, os.pardir, os.pardir, os.pardir, os.pardir, os.pardir, 'tools') |
+sys.path.append(tools_dir) |
+from idl_parser.idl_parser import IDLParser, ListFromConcat |
+from idl_parser.idl_parser import ParseFile as parse_file |
+ |
+from blink_idl_lexer import BlinkIDLLexer |
+ |
+ |
+# Explicitly set starting symbol to rule defined only in base parser. |
+# BEWARE that the starting symbol should NOT be defined in both the base parser |
+# and the derived one, as otherwise which is used depends on which line number |
+# is lower, which is fragile. Instead, either use one in base parser or |
+# create a new symbol, so that this is unambiguous. |
+# FIXME: unfortunately, this doesn't work in PLY 3.4, so need to duplicate the |
+# rule below. |
+STARTING_SYMBOL = 'Definitions' |
+ |
+# We ignore comments (and hence don't need 'Top') but base parser preserves them |
+# FIXME: Upstream: comments should be removed in base parser |
+REMOVED_RULES = ['Top', # [0] |
+ 'Comments', # [0.1] |
+ 'CommentsRest', # [0.2] |
+ ] |
+ |
+# Remove rules from base class |
+# FIXME: add a class method upstream: @classmethod IDLParser._RemoveRules |
+for rule in REMOVED_RULES: |
+ production_name = 'p_' + rule |
+ delattr(IDLParser, production_name) |
+ |
+ |
+class BlinkIDLParser(IDLParser): |
+ # [1] |
+ # FIXME: Need to duplicate rule for starting symbol here, with line number |
+ # *lower* than in the base parser (idl_parser.py). |
+ # This is a bug in PLY: it determines starting symbol by lowest line number. |
+ # This can be overridden by the 'start' parameter, but as of PLY 3.4 this |
+ # doesn't work correctly. |
+ def p_Definitions(self, p): |
+ """Definitions : ExtendedAttributeList Definition Definitions |
+ | """ |
+ if len(p) > 1: |
+ p[2].AddChildren(p[1]) |
+ p[0] = ListFromConcat(p[2], p[3]) |
+ |
+ # Below are grammar rules used by yacc, given by functions named p_<RULE>. |
+ # * The docstring is the production rule in BNF (grammar). |
+ # * The body is the yacc action (semantics). |
+ # |
+ # The PLY framework builds the actual low-level parser by introspecting this |
+ # parser object, selecting all attributes named p_<RULE> as grammar rules. |
+ # It extracts the docstrings and uses them as the production rules, building |
+ # the table of a LALR parser, and uses the body of the functions as actions. |
+ # |
+ # Reference: |
+ # http://www.dabeaz.com/ply/ply.html#ply_nn23 |
+ # |
+ # Review of yacc: |
+ # Yacc parses a token stream, internally producing a Concrete Syntax Tree |
+ # (CST), where each node corresponds to a production rule in the grammar. |
+ # At each node, it runs an action, which is usually "produce a node in the |
+ # Abstract Syntax Tree (AST)" or "ignore this node" (for nodes in the CST |
+ # that aren't included in the AST, since only needed for parsing). |
+ # |
+ # The rules use pseudo-variables; in PLY syntax: |
+ # p[0] is the left side: assign return value to p[0] instead of returning, |
+ # p[1] ... p[n] are the right side: the values can be accessed, and they |
+ # can be modified. |
+ # (In yacc these are $$ and $1 ... $n.) |
+ # |
+ # The rules can look cryptic at first, but there are a few standard |
+ # transforms from the CST to AST. With these in mind, the actions should |
+ # be reasonably legible. |
+ # |
+ # * Ignore production |
+ # Discard this branch. Primarily used when one alternative is empty. |
+ # |
+ # Sample code: |
+ # if len(p) > 1: |
+ # p[0] = ... |
+ # # Note no assignment if len(p) == 1 |
+ # |
+ # * Eliminate singleton production |
+ # Discard this node in the CST, pass the next level down up the tree. |
+ # Used to ignore productions only necessary for parsing, but not needed |
+ # in the AST. |
+ # |
+ # Sample code: |
+ # p[0] = p[1] |
+ # |
+ # * Build node |
+ # The key type of rule. In this parser, produces object of class IDLNode. |
+ # There are several helper functions: |
+ # * BuildProduction: actually builds an IDLNode, based on a production. |
+ # * BuildAttribute: builds an IDLAttribute, which is a temporary |
+ # object to hold a name-value pair, which is then |
+ # set as a Property of the IDLNode when the IDLNode |
+ # is built. |
+ # * BuildNamed: Same as BuildProduction, and sets the 'NAME' property. |
+ # * BuildTrue: BuildAttribute with value True, for flags. |
+ # See base idl_parser.py for definitions and more examples of use. |
+ # |
+ # Sample code: |
+ # # Build node of type NodeType, with value p[1], and children. |
+ # p[0] = self.BuildProduction('NodeType', p, 1, children) |
+ # |
+ # # Build named node of type NodeType, with name and value p[1]. |
+ # # (children optional) |
+ # p[0] = self.BuildNamed('NodeType', p, 1) |
+ # |
+ # # Make a list |
+ # # Used if one node has several children. |
+ # children = ListFromConcat(p[2], p[3]) |
+ # p[0] = self.BuildProduction('NodeType', p, 1, children) |
+ # |
+ # # Also used to collapse the right-associative tree |
+ # # produced by parsing a list back into a single list. |
+ # """Foos : Foo Foos |
+ # |""" |
+ # if len(p) > 1: |
+ # p[0] = ListFromConcat(p[1], p[2]) |
+ # |
+ # # Add children. |
+ # # Primarily used to add attributes, produced via BuildTrue. |
+ # # p_StaticAttribute |
+ # """StaticAttribute : STATIC Attribute""" |
+ # p[2].AddChildren(self.BuildTrue('STATIC')) |
+ # p[0] = p[2] |
+ # |
+ # Numbering scheme for the rules is: |
+ # [1] for Web IDL spec (or additions in base parser) |
+ # These should all be upstreamed to the base parser. |
+ # [b1] for Blink IDL changes (overrides Web IDL) |
+ # [b1.1] for Blink IDL additions, auxiliary rules for [b1] |
+ # Numbers are as per Candidate Recommendation 19 April 2012: |
+ # http://www.w3.org/TR/2012/CR-WebIDL-20120419/ |
+ |
+ # [3] Override action, since we distinguish callbacks |
+ # FIXME: Upstream |
+ def p_CallbackOrInterface(self, p): |
+ """CallbackOrInterface : CALLBACK CallbackRestOrInterface |
+ | Interface""" |
+ if len(p) > 2: |
+ p[2].AddChildren(self.BuildTrue('CALLBACK')) |
+ p[0] = p[2] |
+ else: |
+ p[0] = p[1] |
+ |
+ # [b27] Add strings, more 'Literal' productions |
+ # 'Literal's needed because integers and strings are both internally strings |
+ def p_ConstValue(self, p): |
+ """ConstValue : BooleanLiteral |
+ | FloatLiteral |
+ | IntegerLiteral |
+ | StringLiteral |
+ | null""" |
+ # Standard is (no 'string', fewer 'Literal's): |
+ # ConstValue : BooleanLiteral |
+ # | FloatLiteral |
+ # | integer |
+ # | NULL |
+ p[0] = p[1] |
+ |
+ # [b27.1] |
+ def p_IntegerLiteral(self, p): |
+ """IntegerLiteral : integer""" |
+ p[0] = ListFromConcat(self.BuildAttribute('TYPE', 'integer'), |
+ self.BuildAttribute('NAME', p[1])) |
+ |
+ # [b27.2] |
+ def p_StringLiteral(self, p): |
+ """StringLiteral : string""" |
+ p[0] = ListFromConcat(self.BuildAttribute('TYPE', 'DOMString'), |
+ self.BuildAttribute('NAME', p[1])) |
+ |
+ # [b47] |
+ def p_ExceptionMember(self, p): |
+ """ExceptionMember : Const |
+ | ExceptionField |
+ | Attribute |
+ | ExceptionOperation""" |
+ # Standard is (no Attribute, no ExceptionOperation): |
+ # ExceptionMember : Const |
+ # | ExceptionField |
+ # FIXME: In DOMException.idl, Attributes should be changed to |
+ # ExceptionFields, and Attribute removed from this rule. |
+ p[0] = p[1] |
+ |
+ # [b47.1] |
+ def p_ExceptionOperation(self, p): |
+ """ExceptionOperation : Type identifier '(' ')' ';'""" |
+ # Needed to handle one case in DOMException.idl: |
+ # // Override in a Mozilla compatible format |
+ # [NotEnumerable] DOMString toString(); |
+ # Limited form of Operation to prevent others from being added. |
+ # FIXME: Should be a stringifier instead. |
+ p[0] = self.BuildNamed('ExceptionOperation', p, 2, p[1]) |
+ |
+ # Extended attributes |
+ # [b49] Override base parser: remove comment field, since comments stripped |
+ # FIXME: Upstream |
+ def p_ExtendedAttributeList(self, p): |
+ """ExtendedAttributeList : '[' ExtendedAttribute ExtendedAttributes ']' |
+ | '[' ']' |
+ | """ |
+ if len(p) > 3: |
+ items = ListFromConcat(p[2], p[3]) |
+ p[0] = self.BuildProduction('ExtAttributes', p, 1, items) |
+ |
+ # [b50] Allow optional trailing comma |
+ # Blink-only, marked as WONTFIX in Web IDL spec: |
+ # https://www.w3.org/Bugs/Public/show_bug.cgi?id=22156 |
+ def p_ExtendedAttributes(self, p): |
+ """ExtendedAttributes : ',' ExtendedAttribute ExtendedAttributes |
+ | ',' |
+ |""" |
+ if len(p) > 3: |
+ p[0] = ListFromConcat(p[2], p[3]) |
+ |
+ # [b51] Add ExtendedAttributeIdentAndOrIdent |
+ def p_ExtendedAttribute(self, p): |
+ """ExtendedAttribute : ExtendedAttributeNoArgs |
+ | ExtendedAttributeArgList |
+ | ExtendedAttributeIdent |
+ | ExtendedAttributeIdentList |
+ | ExtendedAttributeStringLiteralList |
+ | ExtendedAttributeNamedArgList""" |
+ p[0] = p[1] |
+ |
+ # [59] |
+ # FIXME: Upstream UnionType |
+ def p_UnionType(self, p): |
+ """UnionType : '(' UnionMemberType OR UnionMemberType UnionMemberTypes ')'""" |
+ members = ListFromConcat(p[2], p[4], p[5]) |
+ p[0] = self.BuildProduction('UnionType', p, 1, members) |
+ |
+ # [60] |
+ def p_UnionMemberType(self, p): |
+ """UnionMemberType : NonAnyType |
+ | UnionType TypeSuffix |
+ | ANY '[' ']' TypeSuffix""" |
+ if len(p) == 2: |
+ p[0] = self.BuildProduction('Type', p, 1, p[1]) |
+ elif len(p) == 3: |
+ p[0] = self.BuildProduction('Type', p, 1, ListFromConcat(p[1], p[2])) |
+ else: |
+ any_node = ListFromConcat(self.BuildProduction('Any', p, 1), p[4]) |
+ p[0] = self.BuildProduction('Type', p, 1, any_node) |
+ |
+ # [61] |
+ def p_UnionMemberTypes(self, p): |
+ """UnionMemberTypes : OR UnionMemberType UnionMemberTypes |
+ |""" |
+ if len(p) > 2: |
+ p[0] = ListFromConcat(p[2], p[3]) |
+ |
+ # [70] Override base parser to remove non-standard sized array |
+ # FIXME: Upstream |
+ def p_TypeSuffix(self, p): |
+ """TypeSuffix : '[' ']' TypeSuffix |
+ | '?' TypeSuffixStartingWithArray |
+ |""" |
+ if len(p) == 4: |
+ p[0] = self.BuildProduction('Array', p, 1, p[3]) |
+ elif len(p) == 3: |
+ p[0] = ListFromConcat(self.BuildTrue('NULLABLE'), p[2]) |
+ |
+ # [b76.1] Add support for compound Extended Attribute values (A&B and A|B) |
+ def p_ExtendedAttributeIdentList(self, p): |
+ """ExtendedAttributeIdentList : identifier '=' identifier '&' IdentAndList |
+ | identifier '=' identifier '|' IdentOrList""" |
+ value = self.BuildAttribute('VALUE', p[3] + p[4] + p[5]) |
+ p[0] = self.BuildNamed('ExtAttribute', p, 1, value) |
+ |
+ # [b76.2] A&B&C |
+ def p_IdentAndList(self, p): |
+ """IdentAndList : identifier '&' IdentAndList |
+ | identifier""" |
+ if len(p) > 3: |
+ p[0] = p[1] + p[2] + p[3] |
+ else: |
+ p[0] = p[1] |
+ |
+ # [b76.3] A|B|C |
+ def p_IdentOrList(self, p): |
+ """IdentOrList : identifier '|' IdentOrList |
+ | identifier""" |
+ if len(p) > 3: |
+ p[0] = p[1] + p[2] + p[3] |
+ else: |
+ p[0] = p[1] |
+ |
+ # Blink extension: Add support for compound Extended Attribute values over string literals ("A"|"B") |
+ def p_ExtendedAttributeStringLiteralList(self, p): |
+ """ExtendedAttributeStringLiteralList : identifier '=' StringLiteralOrList""" |
+ value = self.BuildAttribute('VALUE', p[3]) |
+ p[0] = self.BuildNamed('ExtAttribute', p, 1, value) |
+ |
+ # Blink extension: one or more string literals. The values aren't propagated as literals, |
+ # but their by their value only. |
+ def p_StringLiteralOrList(self, p): |
+ """StringLiteralOrList : StringLiteral '|' StringLiteralOrList |
+ | StringLiteral""" |
+ def unwrap_string(ls): |
+ """Reach in and grab the string literal's "NAME".""" |
+ return ls[1].value |
+ |
+ if len(p) > 3: |
+ p[0] = unwrap_string(p[1]) + p[2] + p[3] |
+ else: |
+ p[0] = unwrap_string(p[1]) |
+ |
+ def __init__(self, |
+ # common parameters |
+ debug=False, |
+ # idl_parser parameters |
+ lexer=None, verbose=False, mute_error=False, |
+ # yacc parameters |
+ outputdir='', optimize=True, write_tables=False, |
+ picklefile=None): |
+ if debug: |
+ # Turn off optimization and caching, and write out tables, |
+ # to help debugging |
+ optimize = False |
+ outputdir = None |
+ picklefile = None |
+ write_tables = True |
+ if outputdir: |
+ picklefile = picklefile or os.path.join(outputdir, 'parsetab.pickle') |
+ |
+ lexer = lexer or BlinkIDLLexer(debug=debug, |
+ outputdir=outputdir, |
+ optimize=optimize) |
+ self.lexer = lexer |
+ self.tokens = lexer.KnownTokens() |
+ # Using SLR (instead of LALR) generates the table faster, |
+ # but produces the same output. This is ok b/c Web IDL (and Blink IDL) |
+ # is an SLR grammar (as is often the case for simple LL(1) grammars). |
+ # |
+ # Optimized mode substantially decreases startup time (by disabling |
+ # error checking), and also allows use of Python's optimized mode. |
+ # See: Using Python's Optimized Mode |
+ # http://www.dabeaz.com/ply/ply.html#ply_nn38 |
+ # |
+ # |picklefile| allows simpler importing than |tabmodule| (parsetab.py), |
+ # as we don't need to modify sys.path; virtually identical speed. |
+ # See: CHANGES, Version 3.2 |
+ # http://ply.googlecode.com/svn/trunk/CHANGES |
+ self.yaccobj = yacc.yacc(module=self, |
+ start=STARTING_SYMBOL, |
+ method='SLR', |
+ debug=debug, |
+ optimize=optimize, |
+ write_tables=write_tables, |
+ picklefile=picklefile) |
+ self.parse_debug = debug |
+ self.verbose = verbose |
+ self.mute_error = mute_error |
+ self._parse_errors = 0 |
+ self._parse_warnings = 0 |
+ self._last_error_msg = None |
+ self._last_error_lineno = 0 |
+ self._last_error_pos = 0 |
+ |
+ |
+################################################################################ |
+ |
+def main(argv): |
+ # If file itself executed, cache parse table |
+ try: |
+ outputdir = argv[1] |
+ except IndexError as err: |
+ print 'Usage: %s OUTPUT_DIR' % argv[0] |
+ return 1 |
+ parser = BlinkIDLParser(outputdir=outputdir) |
+ |
+ |
+if __name__ == '__main__': |
+ sys.exit(main(sys.argv)) |