mojom/mojom_parser/lexer/tokens.go - Issue 1387893002: New lexer for mojom written in go.

Unified Diff: mojom/mojom_parser/lexer/tokens.go

Issue 1387893002: New lexer for mojom written in go. (Closed) Base URL: https://github.com/domokit/mojo.git@master

Patch Set: Created 5 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: mojom/mojom_parser/lexer/tokens.go

diff --git a/mojom/mojom_parser/lexer/tokens.go b/mojom/mojom_parser/lexer/tokens.go

new file mode 100644

index 0000000000000000000000000000000000000000..77a05ba7068cdc9281326f06bf482cecf2b924f8

--- /dev/null

+++ b/mojom/mojom_parser/lexer/tokens.go

@@ -0,0 +1,210 @@

+// Use of this source code is governed by a BSD-style license that can be

+// found in the LICENSE file.

+//

+// TokenKinds is a type which describes the kinds of tokens which can be

+// encountered in a mojom file.

+package lexer

+import (

+ "fmt"

+type TokenKind int

+// TokenKinds

+const (

+ // An error of an unknown nature has occured.

+ ERROR_UNKNOWN TokenKind = iota

mattr 2015/10/12 18:04:13 The convention in go is to use camel case even for

azani 2015/10/13 00:23:46 Done.

+ // A character was found which is not part of a valid token.

+ ERROR_ILLEGAL_CHAR

+ // A quoted string was opened but not closed.

+ ERROR_UNTERMINATED_STRING_LITERAL

+ // A multiline comment was opened but not closed.

+ ERROR_UNTERMINATED_COMMENT

+ // Indicates the end of a stream of tokens.

+ EOF

+ // Punctuators and Separators

+ LPAREN

+ RPAREN

+ LBRACKET

+ RBRACKET

+ LBRACE

+ RBRACE

+ LANGLE

+ RANGLE

+ SEMI

+ COMMA

+ DOT

+ MINUS

+ PLUS

+ AMP

+ QSTN

+ EQUALS

+ RESPONSE

+ // Names

+ NAME

+ // Keywords

+ IMPORT

+ MODULE

+ STRUCT

+ UNION

+ INTERFACE

+ ENUM

+ CONST

+ TRUE

+ FALSE

+ DEFAULT

+ // Constants

+ INT_CONST_DEC

+ INT_CONST_HEX

+ FLOAT_CONST

+ ORDINAL

+ STRING_LITERAL

+// This method is used to generate user-facing strings in compilation error

+// messages. For example for LBRACE we produce the string "'{'". Notice the

+// single-quotes. This will be used for example in an error message that looks

+// like the following:

+// Unexpected token at line 5, column 6: '###'. Expecting '{'.

+func (tokenKind TokenKind) String() string {

+ switch tokenKind {

+ // Errors

+ case ERROR_UNKNOWN:

+ return "unknown token"

+ case ERROR_ILLEGAL_CHAR:

+ return "illegal token"

+ case ERROR_UNTERMINATED_STRING_LITERAL:

+ return "unterminated string literal"

+ case ERROR_UNTERMINATED_COMMENT:

+ return "unterminated comment"

+ // Punctuators and Separators

+ case LPAREN:

+ return "'('"

+ case RPAREN:

+ return "')'"

+ case LBRACKET:

+ return "'['"

+ case RBRACKET:

+ return "']'"

+ case LBRACE:

+ return "'{'"

+ case RBRACE:

+ return "'}'"

+ case LANGLE:

+ return "'<'"

+ case RANGLE:

+ return "'>'"

+ case SEMI:

+ return "';'"

+ case COMMA:

+ return "','"

+ case DOT:

+ return "'.'"

+ case MINUS:

+ return "'-'"

+ case PLUS:

+ return "'+'"

+ case AMP:

+ return "'&'"

+ case QSTN:

+ return "'?'"

+ case EQUALS:

+ return "'='"

+ case RESPONSE:

+ return "'=>'"

+ // Names

+ case NAME:

+ return "a name"

+ // Keywords

+ case IMPORT:

+ return "'import'"

+ case MODULE:

+ return "'module'"

+ case STRUCT:

+ return "'struct'"

+ case UNION:

+ return "'union'"

+ case INTERFACE:

+ return "'interface'"

+ case ENUM:

+ return "'enum'"

+ case CONST:

+ return "'const'"

+ case TRUE:

+ return "'true'"

+ case FALSE:

+ return "'false'"

+ case DEFAULT:

+ return "'default'"

+ // Constants

+ case INT_CONST_DEC:

+ return "decimal integer literal"

+ case INT_CONST_HEX:

+ return "hex integer literal"

+ case FLOAT_CONST:

+ return "float literal"

+ case ORDINAL:

+ return "an ordinal"

+ case STRING_LITERAL:

+ return "a string literal"

+ default:

+ // Note(rudominer) It is important to use %d below so as to avoid

+ // re-invoking this method and causing an infinite recursion.

+ return fmt.Sprintf("%d", tokenKind)

+ }

+type Token struct {

+ Kind TokenKind

+ Text string

+ CharPos int // Position in the source string.

+ LineNo int // First line is 0.

+ LinePos int // Position in the line. First char in line is 0.

+// This method is used to generate user-facing strings in compilation error

mattr 2015/10/12 18:04:13 The usual Go convention is to start all comments w

azani 2015/10/13 00:23:46 Done.

+// messages. This will be used for example in an error message that looks

+// like the following:

+// Unexpected token at line 5, column 6: '###'. Expecting '{'.

+func (t Token) ShortLocationString() string {

+ return fmt.Sprintf("%d,%d", t.LineNo+1, t.LinePos+1)

+func (t Token) LongLocationString() string {

+ return fmt.Sprintf("line %d, column %d", t.LineNo+1, t.LinePos+1)

+// Is this the EOF token that represent the end of the token stream?

+func (t Token) EOF() bool {

+ return t.Kind == EOF

+// This method is used to generate user-facing strings in compilation error

+// messages. For many token kinds the TokenKind.String() method will produce

+// good results for representing the token. But for other TokenKinds we will

+// want to include some information besides a representation of the kind.

+// For example for an ERROR_UNKNOWN kind we wnat to show the text.

+// This will be used for example in an error message that looks

+// like the following:

+// Unexpected token at line 5, column 6: '###'. Expecting '{'.

+func (token Token) String() string {

+ switch token.Kind {

+ case ERROR_UNKNOWN, NAME, STRING_LITERAL, INT_CONST_DEC, INT_CONST_HEX, FLOAT_CONST, ORDINAL:

+ return fmt.Sprintf("'%s'", token.Text)

+ default:

+ return token.Kind.String()

+ }

« mojom/mojom_parser/lexer/token_stream.go ('K') | « mojom/mojom_parser/lexer/token_stream.go ('k') | no next file » | no next file with comments »