tools/gn/tokenizer.h - Issue 21114002: Add initial prototype for the GN meta-buildsystem.

Unified Diff: tools/gn/tokenizer.h

Issue 21114002: Add initial prototype for the GN meta-buildsystem. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: add owners and readme Created 7 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/gn/tokenizer.h

diff --git a/tools/gn/tokenizer.h b/tools/gn/tokenizer.h

new file mode 100644

index 0000000000000000000000000000000000000000..5e0016919f20f72ee470c01b0ec3c33298ad9c07

--- /dev/null

+++ b/tools/gn/tokenizer.h

@@ -0,0 +1,86 @@

+// Use of this source code is governed by a BSD-style license that can be

+// found in the LICENSE file.

+#ifndef TOOLS_GN_TOKENIZER_H_

+#define TOOLS_GN_TOKENIZER_H_

+#include <vector>

+#include "base/basictypes.h"

+#include "base/strings/string_piece.h"

+#include "tools/gn/err.h"

+#include "tools/gn/token.h"

+class InputFile;

+class Tokenizer {

+ public:

+ static std::vector<Token> Tokenize(const InputFile* input_file, Err* err);

+ // Counts lines in the given buffer (the first line is "1") and returns

+ // the byte offset of the beginning of that line, or (size_t)-1 if there

+ // aren't that many lines in the file. Note that this will return the byte

+ // one past the end of the input if the last character is a newline.

+ //

+ // This is a helper function for error output so that the tokenizer's

+ // notion of lines can be used elsewhere.

+ static size_t ByteOffsetOfNthLine(const base::StringPiece& buf, int n);

+ // Returns true if the given offset of the string piece counts as a newline.

+ // The offset must be in the buffer.

+ static bool IsNewline(const base::StringPiece& buffer, size_t offset);

+ static bool IsIdentifierFirstChar(char c) {

+ return (c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z') || c == '_';

+ }

+ static bool IsIdentifierContinuingChar(char c) {

+ // Also allow digits after the first char.

+ return IsIdentifierFirstChar(c) || (c >= '0' && c <= '9');

+ }

+ private:

+ // InputFile must outlive the tokenizer and all generated tokens.

+ explicit Tokenizer(const InputFile* input_file, Err* err);

+ ~Tokenizer();

+ std::vector<Token> Run();

+ void AdvanceToNextToken();

+ Token::Type ClassifyCurrent() const;

+ void AdvanceToEndOfToken(const Location& location, Token::Type type);

+ bool IsCurrentWhitespace() const;

+ bool IsCurrentNewline() const;

+ bool IsCurrentStringTerminator(char quote_char) const;

+ bool CanIncrement() const { return cur_ < input_.size(); }

+ // Increments the current location by one.

+ void Advance();

+ // Returns the current character in the file as a location.

+ Location GetCurrentLocation() const;

+ Err GetErrorForInvalidToken(const Location& location) const;

+ bool done() const { return at_end() || has_error(); }

+ bool at_end() const { return cur_ == input_.size(); }

+ char cur_char() const { return input_[cur_]; }

+ bool has_error() const { return err_->has_error(); }

+ const InputFile* input_file_;

+ const base::StringPiece input_;

+ Err* err_;

+ size_t cur_; // Byte offset into input buffer.

+ int line_number_;

+ int char_in_line_;

+ DISALLOW_COPY_AND_ASSIGN(Tokenizer);

+};

+#endif // TOOLS_GN_TOKENIZER_H_

« no previous file with comments | « tools/gn/token.cc ('k') | tools/gn/tokenizer.cc » ('j') | no next file with comments »