third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java - Issue 1842653006: Update //third_party/protobuf to version 3.

Unified Diff: third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

Issue 1842653006: Update //third_party/protobuf to version 3. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: merge Created 4 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « third_party/protobuf/java/src/main/java/com/google/protobuf/SmallSortedMap.java ('k') | third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormatEscaper.java » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

diff --git a/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java b/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

new file mode 100644

index 0000000000000000000000000000000000000000..c99b52851291e67fc2a1c2ef57a238d3dc47285c

--- /dev/null

+++ b/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

@@ -0,0 +1,2065 @@

+// Protocol Buffers - Google's data interchange format

+// https://developers.google.com/protocol-buffers/

+//

+// Redistribution and use in source and binary forms, with or without

+// modification, are permitted provided that the following conditions are

+// met:

+//

+// * Redistributions of source code must retain the above copyright

+// notice, this list of conditions and the following disclaimer.

+// * Redistributions in binary form must reproduce the above

+// copyright notice, this list of conditions and the following disclaimer

+// in the documentation and/or other materials provided with the

+// distribution.

+// * Neither the name of Google Inc. nor the names of its

+// contributors may be used to endorse or promote products derived from

+// this software without specific prior written permission.

+//

+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

+package com.google.protobuf;

+import com.google.protobuf.Descriptors.Descriptor;

+import com.google.protobuf.Descriptors.EnumDescriptor;

+import com.google.protobuf.Descriptors.EnumValueDescriptor;

+import com.google.protobuf.Descriptors.FieldDescriptor;

+import java.io.IOException;

+import java.math.BigInteger;

+import java.nio.CharBuffer;

+import java.util.ArrayList;

+import java.util.List;

+import java.util.Locale;

+import java.util.Map;

+import java.util.logging.Logger;

+import java.util.regex.Matcher;

+import java.util.regex.Pattern;

+/**

+ * Provide text parsing and formatting support for proto2 instances.

+ * The implementation largely follows google/protobuf/text_format.cc.

+ *

+ * @author wenboz@google.com Wenbo Zhu

+ * @author kenton@google.com Kenton Varda

+ */

+public final class TextFormat {

+ private TextFormat() {}

+ private static final Logger logger =

+ Logger.getLogger(TextFormat.class.getName());

+ private static final Printer DEFAULT_PRINTER = new Printer();

+ private static final Printer SINGLE_LINE_PRINTER =

+ (new Printer()).setSingleLineMode(true);

+ private static final Printer UNICODE_PRINTER =

+ (new Printer()).setEscapeNonAscii(false);

+ /**

+ * Writes the text-format representation of {@code message} to

+ * {@code output} using the default printer, i.e. multi-line output with

+ * non-ASCII characters escaped. (This representation is the new version of

+ * the classic "ProtocolPrinter" output from the original Protocol Buffer

+ * system.)

+ *

+ * @param message the message or builder whose fields are printed

+ * @param output the destination the text is appended to

+ * @throws IOException if appending to {@code output} fails

+ */

+ public static void print(

+ final MessageOrBuilder message, final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ DEFAULT_PRINTER.print(message, generator);

+ }

+ /**

+ * Writes the text-format representation of the unknown fields in

+ * {@code fields} to {@code output} using the default printer.

+ *

+ * @param fields the unknown fields to print

+ * @param output the destination the text is appended to

+ * @throws IOException if appending to {@code output} fails

+ */

+ public static void print(final UnknownFieldSet fields,

+ final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ DEFAULT_PRINTER.printUnknownFields(fields, generator);

+ }

+ /**

+ * Variant of {@code print()} for messages that leaves non-ASCII characters

+ * unescaped in the output.

+ *

+ * @param message the message or builder whose fields are printed

+ * @param output the destination the text is appended to

+ * @throws IOException if appending to {@code output} fails

+ */

+ public static void printUnicode(

+ final MessageOrBuilder message, final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ UNICODE_PRINTER.print(message, generator);

+ }

+ /**

+ * Variant of {@code print()} for unknown field sets that leaves non-ASCII

+ * characters unescaped in the output.

+ *

+ * @param fields the unknown fields to print

+ * @param output the destination the text is appended to

+ * @throws IOException if appending to {@code output} fails

+ */

+ public static void printUnicode(final UnknownFieldSet fields,

+ final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ UNICODE_PRINTER.printUnknownFields(fields, generator);

+ }

+ /**

+ * Generates a human readable form of this message, useful for debugging and

+ * other purposes, with no newline characters.

+ */

+ public static String shortDebugString(final MessageOrBuilder message) {

+ try {

+ final StringBuilder sb = new StringBuilder();

+ SINGLE_LINE_PRINTER.print(message, new TextGenerator(sb));

+ // Single line mode currently might have an extra space at the end.

+ return sb.toString().trim();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Generates a human readable form of the field, useful for debugging

+ * and other purposes, with no newline characters.

+ */

+ public static String shortDebugString(final FieldDescriptor field,

+ final Object value) {

+ try {

+ final StringBuilder sb = new StringBuilder();

+ SINGLE_LINE_PRINTER.printField(field, value, new TextGenerator(sb));

+ return sb.toString().trim();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Generates a human readable form of the unknown fields, useful for debugging

+ * and other purposes, with no newline characters.

+ */

+ public static String shortDebugString(final UnknownFieldSet fields) {

+ try {

+ final StringBuilder sb = new StringBuilder();

+ SINGLE_LINE_PRINTER.printUnknownFields(fields, new TextGenerator(sb));

+ // Single line mode currently might have an extra space at the end.

+ return sb.toString().trim();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Like {@code print()}, but writes directly to a {@code String} and

+ * returns it.

+ */

+ public static String printToString(final MessageOrBuilder message) {

+ try {

+ final StringBuilder text = new StringBuilder();

+ print(message, text);

+ return text.toString();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Like {@code print()}, but writes directly to a {@code String} and

+ * returns it.

+ */

+ public static String printToString(final UnknownFieldSet fields) {

+ try {

+ final StringBuilder text = new StringBuilder();

+ print(fields, text);

+ return text.toString();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Same as {@code printToString()}, except that non-ASCII characters

+ * in string type fields are not escaped in backslash+octals.

+ */

+ public static String printToUnicodeString(final MessageOrBuilder message) {

+ try {

+ final StringBuilder text = new StringBuilder();

+ UNICODE_PRINTER.print(message, new TextGenerator(text));

+ return text.toString();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Same as {@code printToString()}, except that non-ASCII characters

+ * in string type fields are not escaped in backslash+octals.

+ */

+ public static String printToUnicodeString(final UnknownFieldSet fields) {

+ try {

+ final StringBuilder text = new StringBuilder();

+ UNICODE_PRINTER.printUnknownFields(fields, new TextGenerator(text));

+ return text.toString();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Writes a single field (name and value) to {@code output} using the

+ * default printer. For a repeated field, {@code value} is treated as a

+ * list and every element is printed as its own entry.

+ *

+ * @param field the descriptor of the field

+ * @param value the value of the field

+ * @param output the destination the text is appended to

+ * @throws IOException if appending to {@code output} fails

+ */

+ public static void printField(final FieldDescriptor field,

+ final Object value,

+ final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ DEFAULT_PRINTER.printField(field, value, generator);

+ }

+ public static String printFieldToString(final FieldDescriptor field,

+ final Object value) {

+ try {

+ final StringBuilder text = new StringBuilder();

+ printField(field, value, text);

+ return text.toString();

+ } catch (IOException e) {

+ throw new IllegalStateException(e);

+ }

+ /**

+ * Writes only the value of a field (without its name) to {@code output},

+ * formatted according to the field's declared type.

+ *

+ * @param field the descriptor of the field

+ * @param value the value of the field

+ * @param output the output to which to append the formatted value

+ * @throws ClassCastException if the value is not appropriate for the

+ * given field descriptor

+ * @throws IOException if there is an exception writing to the output

+ */

+ public static void printFieldValue(final FieldDescriptor field,

+ final Object value,

+ final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ DEFAULT_PRINTER.printFieldValue(field, value, generator);

+ }

+ /**

+ * Writes the value of an unknown field to {@code output}. The wire type

+ * encoded in {@code tag} selects the formatting and the expected runtime

+ * type of {@code value}: {@code Long} for varint and fixed64,

+ * {@code Integer} for fixed32, {@link ByteString} for length-delimited and

+ * {@link UnknownFieldSet} for groups.

+ *

+ * @param tag the field's tag number

+ * @param value the value of the field

+ * @param output the output to which to append the formatted value

+ * @throws ClassCastException if the value is not appropriate for the

+ * wire type encoded in the tag

+ * @throws IllegalArgumentException if the tag carries any other wire type

+ * @throws IOException if there is an exception writing to the output

+ */

+ public static void printUnknownFieldValue(final int tag,

+ final Object value,

+ final Appendable output)

+ throws IOException {

+ final TextGenerator generator = new TextGenerator(output);

+ printUnknownFieldValue(tag, value, generator);

+ }

+ private static void printUnknownFieldValue(final int tag,

+ final Object value,

+ final TextGenerator generator)

+ throws IOException {

+ switch (WireFormat.getTagWireType(tag)) {

+ case WireFormat.WIRETYPE_VARINT:

+ generator.print(unsignedToString((Long) value));

+ break;

+ case WireFormat.WIRETYPE_FIXED32:

+ generator.print(

+ String.format((Locale) null, "0x%08x", (Integer) value));

+ break;

+ case WireFormat.WIRETYPE_FIXED64:

+ generator.print(String.format((Locale) null, "0x%016x", (Long) value));

+ break;

+ case WireFormat.WIRETYPE_LENGTH_DELIMITED:

+ generator.print("\"");

+ generator.print(escapeBytes((ByteString) value));

+ generator.print("\"");

+ break;

+ case WireFormat.WIRETYPE_START_GROUP:

+ DEFAULT_PRINTER.printUnknownFields((UnknownFieldSet) value, generator);

+ break;

+ default:

+ throw new IllegalArgumentException("Bad tag: " + tag);

+ }

+ /** Helper class for converting protobufs to text. */

+ private static final class Printer {

+ /** Whether to omit newlines from the output. */

+ boolean singleLineMode = false;

+ /** Whether to escape non ASCII characters with backslash and octal. */

+ boolean escapeNonAscii = true;

+ private Printer() {}

+ /** Sets whether newlines are omitted from the output; returns this printer so calls can be chained. */

+ private Printer setSingleLineMode(boolean singleLineMode) {

+ this.singleLineMode = singleLineMode;

+ return this;

+ }

+ /** Sets whether non-ASCII characters are escaped with backslash and octal; returns this printer so calls can be chained. */

+ private Printer setEscapeNonAscii(boolean escapeNonAscii) {

+ this.escapeNonAscii = escapeNonAscii;

+ return this;

+ }

+ private void print(

+ final MessageOrBuilder message, final TextGenerator generator)

+ throws IOException {

+ for (Map.Entry<FieldDescriptor, Object> field

+ : message.getAllFields().entrySet()) {

+ printField(field.getKey(), field.getValue(), generator);

+ }

+ printUnknownFields(message.getUnknownFields(), generator);

+ }

+ private void printField(final FieldDescriptor field, final Object value,

+ final TextGenerator generator) throws IOException {

+ if (field.isRepeated()) {

+ // Repeated field. Print each element.

+ for (Object element : (List<?>) value) {

+ printSingleField(field, element, generator);

+ }

+ } else {

+ printSingleField(field, value, generator);

+ }

+ private void printSingleField(final FieldDescriptor field,

+ final Object value,

+ final TextGenerator generator)

+ throws IOException {

+ if (field.isExtension()) {

+ generator.print("[");

+ // We special-case MessageSet elements for compatibility with proto1.

+ if (field.getContainingType().getOptions().getMessageSetWireFormat()

+ && (field.getType() == FieldDescriptor.Type.MESSAGE)

+ && (field.isOptional())

+ // object equality

+ && (field.getExtensionScope() == field.getMessageType())) {

+ generator.print(field.getMessageType().getFullName());

+ } else {

+ generator.print(field.getFullName());

+ }

+ generator.print("]");

+ } else {

+ if (field.getType() == FieldDescriptor.Type.GROUP) {

+ // Groups must be serialized with their original capitalization.

+ generator.print(field.getMessageType().getName());

+ } else {

+ generator.print(field.getName());

+ }

+ if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

+ if (singleLineMode) {

+ generator.print(" { ");

+ } else {

+ generator.print(" {\n");

+ generator.indent();

+ }

+ } else {

+ generator.print(": ");

+ }

+ printFieldValue(field, value, generator);

+ if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

+ if (singleLineMode) {

+ generator.print("} ");

+ } else {

+ generator.outdent();

+ generator.print("}\n");

+ }

+ } else {

+ if (singleLineMode) {

+ generator.print(" ");

+ } else {

+ generator.print("\n");

+ }

+ private void printFieldValue(final FieldDescriptor field,

+ final Object value,

+ final TextGenerator generator)

+ throws IOException {

+ switch (field.getType()) {

+ case INT32:

+ case SINT32:

+ case SFIXED32:

+ generator.print(((Integer) value).toString());

+ break;

+ case INT64:

+ case SINT64:

+ case SFIXED64:

+ generator.print(((Long) value).toString());

+ break;

+ case BOOL:

+ generator.print(((Boolean) value).toString());

+ break;

+ case FLOAT:

+ generator.print(((Float) value).toString());

+ break;

+ case DOUBLE:

+ generator.print(((Double) value).toString());

+ break;

+ case UINT32:

+ case FIXED32:

+ generator.print(unsignedToString((Integer) value));

+ break;

+ case UINT64:

+ case FIXED64:

+ generator.print(unsignedToString((Long) value));

+ break;

+ case STRING:

+ generator.print("\"");

+ generator.print(escapeNonAscii

+ ? escapeText((String) value)

+ : escapeDoubleQuotesAndBackslashes((String) value)

+ .replace("\n", "\\n"));

+ generator.print("\"");

+ break;

+ case BYTES:

+ generator.print("\"");

+ if (value instanceof ByteString) {

+ generator.print(escapeBytes((ByteString) value));

+ } else {

+ generator.print(escapeBytes((byte[]) value));

+ }

+ generator.print("\"");

+ break;

+ case ENUM:

+ generator.print(((EnumValueDescriptor) value).getName());

+ break;

+ case MESSAGE:

+ case GROUP:

+ print((Message) value, generator);

+ break;

+ }

+ private void printUnknownFields(final UnknownFieldSet unknownFields,

+ final TextGenerator generator)

+ throws IOException {

+ for (Map.Entry<Integer, UnknownFieldSet.Field> entry :

+ unknownFields.asMap().entrySet()) {

+ final int number = entry.getKey();

+ final UnknownFieldSet.Field field = entry.getValue();

+ printUnknownField(number, WireFormat.WIRETYPE_VARINT,

+ field.getVarintList(), generator);

+ printUnknownField(number, WireFormat.WIRETYPE_FIXED32,

+ field.getFixed32List(), generator);

+ printUnknownField(number, WireFormat.WIRETYPE_FIXED64,

+ field.getFixed64List(), generator);

+ printUnknownField(number, WireFormat.WIRETYPE_LENGTH_DELIMITED,

+ field.getLengthDelimitedList(), generator);

+ for (final UnknownFieldSet value : field.getGroupList()) {

+ generator.print(entry.getKey().toString());

+ if (singleLineMode) {

+ generator.print(" { ");

+ } else {

+ generator.print(" {\n");

+ generator.indent();

+ }

+ printUnknownFields(value, generator);

+ if (singleLineMode) {

+ generator.print("} ");

+ } else {

+ generator.outdent();

+ generator.print("}\n");

+ }

+ private void printUnknownField(final int number,

+ final int wireType,

+ final List<?> values,

+ final TextGenerator generator)

+ throws IOException {

+ for (final Object value : values) {

+ generator.print(String.valueOf(number));

+ generator.print(": ");

+ printUnknownFieldValue(wireType, value, generator);

+ generator.print(singleLineMode ? " " : "\n");

+ }

+ /** Convert an unsigned 32-bit integer to a string. */

+ public static String unsignedToString(final int value) {

+ if (value >= 0) {

+ return Integer.toString(value);

+ } else {

+ return Long.toString(value & 0x00000000FFFFFFFFL);

+ }

+ /** Convert an unsigned 64-bit integer to a string. */

+ public static String unsignedToString(final long value) {

+ if (value >= 0) {

+ return Long.toString(value);

+ } else {

+ // Pull off the most-significant bit so that BigInteger doesn't think

+ // the number is negative, then set it again using setBit().

+ return BigInteger.valueOf(value & 0x7FFFFFFFFFFFFFFFL)

+ .setBit(63).toString();

+ }

+ /**

+ * An inner class for writing text to the output stream.

+ */

+ private static final class TextGenerator {

+ private final Appendable output;

+ private final StringBuilder indent = new StringBuilder();

+ private boolean atStartOfLine = true;

+ private TextGenerator(final Appendable output) { // Wraps the sink that write() appends text to.

+ this.output = output; // Stored as-is; no null check is performed here.

+ }

+ /**

+ * Indent text by two spaces. After calling indent(), two spaces will be

+ * inserted at the beginning of each line of text. indent() may be called

+ * multiple times to produce deeper indents.

+ */

+ public void indent() {

+ // Must append exactly two characters: outdent() removes two per level,

+ // so a one-character indent would make the first outdent() call

+ // delete(-1, 1) and fail with StringIndexOutOfBoundsException.

+ indent.append("  ");

+ }

+ /**

+ * Removes the last two characters of the current indent, undoing one

+ * indent level.

+ *

+ * @throws IllegalArgumentException if the current indent is empty

+ */

+ public void outdent() {

+ final int currentWidth = indent.length();

+ if (currentWidth != 0) {

+ indent.delete(currentWidth - 2, currentWidth);

+ return;

+ }

+ throw new IllegalArgumentException(

+ " Outdent() without matching Indent().");

+ }

+ /**

+ * Print text to the output stream.

+ */

+ public void print(final CharSequence text) throws IOException {

+ final int size = text.length();

+ int pos = 0;

+ for (int i = 0; i < size; i++) {

+ if (text.charAt(i) == '\n') {

+ write(text.subSequence(pos, i + 1));

+ pos = i + 1;

+ atStartOfLine = true;

+ }

+ write(text.subSequence(pos, size));

+ }

+ /**

+ * Appends {@code data} to the output, first emitting the current indent

+ * if this is the first non-empty write on the line. Empty input is

+ * ignored and leaves the start-of-line flag untouched.

+ */

+ private void write(final CharSequence data) throws IOException {

+ if (data.length() != 0) {

+ if (atStartOfLine) {

+ // Clear the flag before appending, exactly as before, so the state is

+ // the same even if the append below throws.

+ atStartOfLine = false;

+ output.append(indent);

+ }

+ output.append(data);

+ }

+ }

+ // =================================================================

+ // Parsing

+ /**

+ * Represents a stream of tokens parsed from a {@code String}.

+ *

+ * <p>The Java standard library provides many classes that you might think

+ * would be useful for implementing this, but aren't. For example:

+ *

+ * <ul>

+ * <li>{@code java.io.StreamTokenizer}: This almost does what we want -- or,

+ * at least, something that would get us close to what we want -- except

+ * for one fatal flaw: It automatically un-escapes strings using Java

+ * escape sequences, which do not include all the escape sequences we

+ * need to support (e.g. '\x').

+ * <li>{@code java.util.Scanner}: This seems like a great way at least to

+ * parse regular expressions out of a stream (so we wouldn't have to load

+ * the entire input into a single string before parsing). Sadly,

+ * {@code Scanner} requires that tokens be delimited with some delimiter.

+ * Thus, although the text "foo:" should parse to two tokens ("foo" and

+ * ":"), {@code Scanner} would recognize it only as a single token.

+ * Furthermore, {@code Scanner} provides no way to inspect the contents

+ * of delimiters, making it impossible to keep track of line and column

+ * numbers.

+ * </ul>

+ *

+ * <p>Luckily, Java's regular expression support does manage to be useful to

+ * us. (Barely: We need {@code Matcher.usePattern()}, which is new in

+ * Java 1.5.) So, we can use that, at least. Unfortunately, this implies

+ * that we need to have the entire input in one contiguous string.

+ */

+ private static final class Tokenizer {

+ private final CharSequence text;

+ private final Matcher matcher;

+ private String currentToken;

+ // The character index within this.text at which the current token begins.

+ private int pos = 0;

+ // The line and column numbers of the current token.

+ private int line = 0;

+ private int column = 0;

+ // The line and column numbers of the previous token (allows throwing

+ // errors *after* consuming).

+ private int previousLine = 0;

+ private int previousColumn = 0;

+ // We use possessive quantifiers (*+ and ++) because otherwise the Java

+ // regex matcher has stack overflows on large inputs.

+ private static final Pattern WHITESPACE =

+ Pattern.compile("(\\s|(#.*$))++", Pattern.MULTILINE);

+ private static final Pattern TOKEN = Pattern.compile(

+ "[a-zA-Z_][0-9a-zA-Z_+-]*+|" + // an identifier

+ "[.]?[0-9+-][0-9a-zA-Z_.+-]*+|" + // a number

+ "\"([^\"\n\\\\]|\\\\.)*+(\"|\\\\?$)|" + // a double-quoted string

+ "\'([^\'\n\\\\]|\\\\.)*+(\'|\\\\?$)", // a single-quoted string

+ Pattern.MULTILINE);

+ private static final Pattern DOUBLE_INFINITY = Pattern.compile(

+ "-?inf(inity)?",

+ Pattern.CASE_INSENSITIVE);

+ private static final Pattern FLOAT_INFINITY = Pattern.compile(

+ "-?inf(inity)?f?",

+ Pattern.CASE_INSENSITIVE);

+ private static final Pattern FLOAT_NAN = Pattern.compile(

+ "nanf?",

+ Pattern.CASE_INSENSITIVE);

+ /** Constructs a tokenizer over {@code text}, skips any leading whitespace/comments and loads the first token. */

+ private Tokenizer(final CharSequence text) {

+ this.text = text;

+ this.matcher = WHITESPACE.matcher(text); // The pattern is swapped via usePattern() as tokenizing proceeds.

+ skipWhitespace(); // Move the matcher region to the start of the first token.

+ nextToken(); // Populate currentToken so the query methods can be used right away.

+ }

+ /**

+ * Reports whether the input is exhausted, which is signalled by an empty

+ * current token.

+ */

+ public boolean atEnd() {

+ final boolean noTokenLeft = currentToken.length() == 0;

+ return noTokenLeft;

+ }

+ /** Advance to the next token. */

+ public void nextToken() {

+ previousLine = line;

+ previousColumn = column;

+ // Advance the line counter to the current position.

+ while (pos < matcher.regionStart()) {

+ if (text.charAt(pos) == '\n') {

+ ++line;

+ column = 0;

+ } else {

+ ++column;

+ }

+ ++pos;

+ }

+ // Match the next token.

+ if (matcher.regionStart() == matcher.regionEnd()) {

+ // EOF

+ currentToken = "";

+ } else {

+ matcher.usePattern(TOKEN);

+ if (matcher.lookingAt()) {

+ currentToken = matcher.group();

+ matcher.region(matcher.end(), matcher.regionEnd());

+ } else {

+ // Take one character.

+ currentToken = String.valueOf(text.charAt(pos));

+ matcher.region(pos + 1, matcher.regionEnd());

+ }

+ skipWhitespace();

+ }

+ /**

+ * Skip over any whitespace so that the matcher region starts at the next

+ * token.

+ */

+ private void skipWhitespace() {

+ matcher.usePattern(WHITESPACE);

+ if (matcher.lookingAt()) {

+ matcher.region(matcher.end(), matcher.regionEnd());

+ }

+ /**

+ * If the next token exactly matches {@code token}, consume it and return

+ * {@code true}. Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsume(final String token) {

+ if (currentToken.equals(token)) {

+ nextToken();

+ return true;

+ } else {

+ return false;

+ }

+ /**

+ * If the next token exactly matches {@code token}, consume it. Otherwise,

+ * throw a {@link ParseException}.

+ */

+ public void consume(final String token) throws ParseException {

+ if (!tryConsume(token)) {

+ throw parseException("Expected \"" + token + "\".");

+ }

+ /**

+ * Returns {@code true} if the current token begins like an integer, i.e.

+ * its first character is a decimal digit, {@code '-'} or {@code '+'}.

+ * Only the first character is inspected and the token is not consumed.

+ */

+ public boolean lookingAtInteger() {

+ if (currentToken.length() > 0) {

+ final char first = currentToken.charAt(0);

+ final boolean isDigit = first >= '0' && first <= '9';

+ return isDigit || first == '-' || first == '+';

+ }

+ return false;

+ }

+ /**

+ * Returns {@code true} if the current token is exactly equal to {@code text}; the token is

+ * not consumed. Note that the parameter shadows the {@code text} field holding the input.

+ */

+ public boolean lookingAt(String text) {

+ return currentToken.equals(text);

+ }

+ /**

+ * If the next token is an identifier, consume it and return its value.

+ * Otherwise, throw a {@link ParseException}.

+ */

+ public String consumeIdentifier() throws ParseException {

+ for (int i = 0; i < currentToken.length(); i++) {

+ final char c = currentToken.charAt(i);

+ if (('a' <= c && c <= 'z')

+ || ('A' <= c && c <= 'Z')

+ || ('0' <= c && c <= '9')

+ || (c == '_') || (c == '.')) {

+ // OK

+ } else {

+ throw parseException(

+ "Expected identifier. Found '" + currentToken + "'");

+ }

+ final String result = currentToken;

+ nextToken();

+ return result;

+ }

+ /**

+ * If the next token is an identifier, consume it and return {@code true}.

+ * Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsumeIdentifier() {

+ try {

+ consumeIdentifier();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * If the next token is a 32-bit signed integer, consume it and return its

+ * value. Otherwise, throw a {@link ParseException}.

+ */

+ public int consumeInt32() throws ParseException {

+ try {

+ final int result = parseInt32(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw integerParseException(e);

+ }

+ /**

+ * If the next token is a 32-bit unsigned integer, consume it and return its

+ * value. Otherwise, throw a {@link ParseException}.

+ */

+ public int consumeUInt32() throws ParseException {

+ try {

+ final int result = parseUInt32(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw integerParseException(e);

+ }

+ /**

+ * If the next token is a 64-bit signed integer, consume it and return its

+ * value. Otherwise, throw a {@link ParseException}.

+ */

+ public long consumeInt64() throws ParseException {

+ try {

+ final long result = parseInt64(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw integerParseException(e);

+ }

+ /**

+ * If the next token is a 64-bit signed integer, consume it and return

+ * {@code true}. Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsumeInt64() {

+ try {

+ consumeInt64();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * If the next token is a 64-bit unsigned integer, consume it and return its

+ * value. Otherwise, throw a {@link ParseException}.

+ */

+ public long consumeUInt64() throws ParseException {

+ try {

+ final long result = parseUInt64(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw integerParseException(e);

+ }

+ /**

+ * If the next token is a 64-bit unsigned integer, consume it and return

+ * {@code true}. Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsumeUInt64() {

+ try {

+ consumeUInt64();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * If the next token is a double, consume it and return its value.

+ * Otherwise, throw a {@link ParseException}.

+ */

+ public double consumeDouble() throws ParseException {

+ // We need to parse infinity and nan separately because

+ // Double.parseDouble() does not accept "inf", "infinity", or "nan".

+ if (DOUBLE_INFINITY.matcher(currentToken).matches()) {

+ final boolean negative = currentToken.startsWith("-");

+ nextToken();

+ return negative ? Double.NEGATIVE_INFINITY : Double.POSITIVE_INFINITY;

+ }

+ if (currentToken.equalsIgnoreCase("nan")) {

+ nextToken();

+ return Double.NaN;

+ }

+ try {

+ final double result = Double.parseDouble(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw floatParseException(e);

+ }

+ /**

+ * If the next token is a double, consume it and return {@code true}.

+ * Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsumeDouble() {

+ try {

+ consumeDouble();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * If the next token is a float, consume it and return its value.

+ * Otherwise, throw a {@link ParseException}.

+ */

+ public float consumeFloat() throws ParseException {

+ // We need to parse infinity and nan separately because

+ // Float.parseFloat() does not accept "inf", "infinity", or "nan".

+ if (FLOAT_INFINITY.matcher(currentToken).matches()) {

+ final boolean negative = currentToken.startsWith("-");

+ nextToken();

+ return negative ? Float.NEGATIVE_INFINITY : Float.POSITIVE_INFINITY;

+ }

+ if (FLOAT_NAN.matcher(currentToken).matches()) {

+ nextToken();

+ return Float.NaN;

+ }

+ try {

+ final float result = Float.parseFloat(currentToken);

+ nextToken();

+ return result;

+ } catch (NumberFormatException e) {

+ throw floatParseException(e);

+ }

+ /**

+ * If the next token is a float, consume it and return {@code true}.

+ * Otherwise, return {@code false} without doing anything.

+ */

+ public boolean tryConsumeFloat() {

+ try {

+ consumeFloat();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * If the next token is a boolean, consume it and return its value.

+ * Otherwise, throw a {@link ParseException}.

+ */

+ public boolean consumeBoolean() throws ParseException {

+ if (currentToken.equals("true")

+ || currentToken.equals("t")

+ || currentToken.equals("1")) {

+ nextToken();

+ return true;

+ } else if (currentToken.equals("false")

+ || currentToken.equals("f")

+ || currentToken.equals("0")) {

+ nextToken();

+ return false;

+ } else {

+ throw parseException("Expected \"true\" or \"false\".");

+ }

+ /**

+ * Consumes the string literal at the current position and returns its

+ * unescaped bytes decoded as UTF-8.

+ *

+ * @throws ParseException if the current token is not a string literal

+ */

+ public String consumeString() throws ParseException {

+ final ByteString unescaped = consumeByteString();

+ return unescaped.toStringUtf8();

+ }

+ /**

+ * If the next token is a string, consume it and return true. Otherwise,

+ * return false.

+ */

+ public boolean tryConsumeString() {

+ try {

+ consumeString();

+ return true;

+ } catch (ParseException e) {

+ return false;

+ }

+ /**

+ * Consumes one string literal plus any string literals that immediately

+ * follow it, unescapes each one and returns the pieces concatenated as a

+ * single {@link ByteString}.

+ *

+ * @throws ParseException if the current token is not a string literal

+ */

+ public ByteString consumeByteString() throws ParseException {

+ final List<ByteString> pieces = new ArrayList<ByteString>();

+ // The first literal is mandatory; further adjacent literals are optional.

+ do {

+ consumeByteString(pieces);

+ } while (currentToken.startsWith("'") || currentToken.startsWith("\""));

+ return ByteString.copyFrom(pieces);

+ }

+ /**

+ * Like {@link #consumeByteString()} but adds each token of the string to

+ * the given list. String literals (whether bytes or text) may come in

+ * multiple adjacent tokens which are automatically concatenated, like in

+ * C or Python.

+ *

+ * <p>This overload consumes exactly one token. It throws a

+ * {@link ParseException} if the current token does not start with a quote

+ * character, if it does not end with the same quote character, or if its

+ * contents contain an invalid escape sequence. The tokenizer only advances

+ * once the token has been unescaped successfully.

+ */

+ private void consumeByteString(List<ByteString> list)

+ throws ParseException {

+ final char quote = currentToken.length() > 0

+ ? currentToken.charAt(0)

+ : '\0'; // empty token: '\0' is not a quote, so the next check rejects it

+ if (quote != '\"' && quote != '\'') {

+ throw parseException("Expected string.");

+ }

+ if (currentToken.length() < 2

+ || currentToken.charAt(currentToken.length() - 1) != quote) {

+ throw parseException("String missing ending quote.");

+ }

+ try {

+ final String escaped =

+ currentToken.substring(1, currentToken.length() - 1); // strip the surrounding quotes

+ final ByteString result = unescapeBytes(escaped);

+ nextToken();

+ list.add(result);

+ } catch (InvalidEscapeSequenceException e) {

+ throw parseException(e.getMessage()); // re-reported with the tokenizer's line/column

+ }

+ /**

+ * Returns a {@link ParseException} with the current line and column

+ * numbers in the description, suitable for throwing.

+ *

+ * @param description the error text to carry in the exception

+ * @return a new exception; it is returned, not thrown

+ */

+ public ParseException parseException(final String description) {

+ // Note: People generally prefer one-based line and column numbers.

+ return new ParseException(

+ line + 1, column + 1, description);

+ }

+ /**

+ * Returns a {@link ParseException} with the line and column numbers of

+ * the previous token in the description, suitable for throwing.

+ *

+ * @param description the error text to carry in the exception

+ * @return a new exception; it is returned, not thrown

+ */

+ public ParseException parseExceptionPreviousToken(

+ final String description) {

+ // Note: People generally prefer one-based line and column numbers.

+ return new ParseException(

+ previousLine + 1, previousColumn + 1, description);

+ }

+ /**

+ * Constructs an appropriate {@link ParseException} for the given

+ * {@code NumberFormatException} when trying to parse an integer.

+ *

+ * <p>The result is positioned at the current line and column and its text is

+ * the message of {@code e} prefixed with "Couldn't parse integer: ".

+ */

+ private ParseException integerParseException(

+ final NumberFormatException e) {

+ return parseException("Couldn't parse integer: " + e.getMessage());

+ }

+ /**

+ * Constructs an appropriate {@link ParseException} for the given

+ * {@code NumberFormatException} when trying to parse a float or double.

+ *

+ * <p>The result is positioned at the current line and column and its text is

+ * the message of {@code e} prefixed with "Couldn't parse number: ".

+ */

+ private ParseException floatParseException(final NumberFormatException e) {

+ return parseException("Couldn't parse number: " + e.getMessage());

+ }

+ /**

+ * Returns a {@link UnknownFieldParseException} with the line and column

+ * numbers of the previous token in the description, and the unknown field

+ * name, suitable for throwing.

+ *

+ * @param unknownField the field name that could not be resolved

+ * @param description the error text to carry in the exception

+ * @return a new exception; it is returned, not thrown

+ */

+ public UnknownFieldParseException unknownFieldParseExceptionPreviousToken(

+ final String unknownField, final String description) {

+ // Note: People generally prefer one-based line and column numbers.

+ return new UnknownFieldParseException(

+ previousLine + 1, previousColumn + 1, unknownField, description);

+ }

+ /** Thrown when parsing an invalid text format message. */

+ public static class ParseException extends IOException {

+ private static final long serialVersionUID = 3196188060225107702L;

+ private final int line;

+ private final int column;

+ /** Create a new instance, with -1 as the line and column numbers. */

+ public ParseException(final String message) {

+ this(-1, -1, message);

+ }

+ /**

+ * Create a new instance. The exception message is built as

+ * {@code line + ":" + column + ": " + message}.

+ *

+ * @param line the line number where the parse error occurred,

+ * using 1-offset.

+ * @param column the column number where the parser error occurred,

+ * using 1-offset.

+ * @param message the description of the error, appended after the position.

+ */

+ public ParseException(final int line, final int column,

+ final String message) {

+ super(Integer.toString(line) + ":" + column + ": " + message);

+ this.line = line;

+ this.column = column;

+ }

+ /**

+ * Return the line where the parse exception occurred, or -1 when

+ * none is provided. The value is specified as 1-offset, so the first

+ * line is line 1.

+ */

+ public int getLine() {

+ return line;

+ }

+ /**

+ * Return the column where the parse exception occurred, or -1 when

+ * none is provided. The value is specified as 1-offset, so the first

+ * column is column 1.

+ */

+ public int getColumn() {

+ return column;

+ }

+ /**

+ * Thrown when encountering an unknown field while parsing

+ * a text format message. In addition to the position carried by

+ * {@link ParseException}, it records the name of the offending field.

+ */

+ public static class UnknownFieldParseException extends ParseException {

+ private final String unknownField;

+ /**

+ * Create a new instance, with -1 as the line and column numbers, and an

+ * empty unknown field name.

+ */

+ public UnknownFieldParseException(final String message) {

+ this(-1, -1, "", message);

+ }

+ /**

+ * Create a new instance

+ *

+ * @param line the line number where the parse error occurred,

+ * using 1-offset.

+ * @param column the column number where the parser error occurred,

+ * using 1-offset.

+ * @param unknownField the name of the unknown field found while parsing.

+ * @param message the description of the error.

+ */

+ public UnknownFieldParseException(final int line, final int column,

+ final String unknownField, final String message) {

+ super(line, column, message);

+ this.unknownField = unknownField;

+ }

+ /**

+ * Return the name of the unknown field encountered while parsing the

+ * protocol buffer string.

+ */

+ public String getUnknownField() {

+ return unknownField;

+ }

+ private static final Parser PARSER = Parser.newBuilder().build(); // shared default parser, built from an unconfigured builder

+ /**

+ * Return a {@link Parser} instance which can parse text-format

+ * messages. The returned instance is thread-safe.

+ *

+ * <p>Every call returns the same shared instance.

+ */

+ public static Parser getParser() {

+ return PARSER;

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}.

+ *

+ * <p>Convenience wrapper that forwards to the shared default parser.

+ */

+ public static void merge(final Readable input,

+ final Message.Builder builder)

+ throws IOException {

+ PARSER.merge(input, builder);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}.

+ *

+ * <p>Convenience wrapper that forwards to the shared default parser.

+ */

+ public static void merge(final CharSequence input,

+ final Message.Builder builder)

+ throws ParseException {

+ PARSER.merge(input, builder);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}. Extensions will be recognized if they are

+ * registered in {@code extensionRegistry}.

+ *

+ * <p>Convenience wrapper that forwards to the shared default parser.

+ */

+ public static void merge(final Readable input,

+ final ExtensionRegistry extensionRegistry,

+ final Message.Builder builder)

+ throws IOException {

+ PARSER.merge(input, extensionRegistry, builder);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}. Extensions will be recognized if they are

+ * registered in {@code extensionRegistry}.

+ *

+ * <p>Convenience wrapper that forwards to the shared default parser.

+ */

+ public static void merge(final CharSequence input,

+ final ExtensionRegistry extensionRegistry,

+ final Message.Builder builder)

+ throws ParseException {

+ PARSER.merge(input, extensionRegistry, builder);

+ }

+ /**

+ * Parser for text-format proto2 instances. This class is thread-safe.

+ * The implementation largely follows google/protobuf/text_format.cc.

+ *

+ * <p>Use {@link TextFormat#getParser()} to obtain the default parser, or

+ * {@link Builder} to control the parser behavior.

+ */

+ public static class Parser {

+ /**

+ * Determines if repeated values for non-repeated fields and

+ * oneofs are permitted. For example, given required/optional field "foo"

+ * and a oneof containing "baz" and "qux":

+ * <ul>

+ * <li>"foo: 1 foo: 2"

+ * <li>"baz: 1 qux: 2"

+ * <li>merging "foo: 2" into a proto in which foo is already set, or

+ * <li>merging "qux: 2" into a proto in which baz is already set.

+ * </ul>

+ */

+ public enum SingularOverwritePolicy {

+ /** The last value is retained. */

+ ALLOW_SINGULAR_OVERWRITES,

+ /** The parser rejects the input with a {@link ParseException}. */

+ FORBID_SINGULAR_OVERWRITES

+ }

+ private final boolean allowUnknownFields; // true: unknown fields/extensions are logged and skipped; false: they raise a parse exception

+ private final SingularOverwritePolicy singularOverwritePolicy; // consulted when a non-repeated field or a oneof is assigned

+ private Parser(boolean allowUnknownFields, // private: instances are created through Builder.build()

+ SingularOverwritePolicy singularOverwritePolicy) {

+ this.allowUnknownFields = allowUnknownFields;

+ this.singularOverwritePolicy = singularOverwritePolicy;

+ }

+ /**

+ * Returns a new instance of {@link Builder}.

+ *

+ * <p>Each call creates a fresh builder holding the default settings.

+ */

+ public static Builder newBuilder() {

+ return new Builder();

+ }

+ /**

+ * Builder that can be used to obtain new instances of {@link Parser}.

+ *

+ * <p>Defaults: unknown fields are not allowed and singular overwrites are

+ * allowed.

+ */

+ public static class Builder {

+ private boolean allowUnknownFields = false; // NOTE(review): no setter is visible in this section, so this appears to stay false - confirm

+ private SingularOverwritePolicy singularOverwritePolicy =

+ SingularOverwritePolicy.ALLOW_SINGULAR_OVERWRITES;

+ /**

+ * Sets parser behavior when a non-repeated field appears more than once.

+ *

+ * @return this builder, to allow call chaining

+ */

+ public Builder setSingularOverwritePolicy(SingularOverwritePolicy p) {

+ this.singularOverwritePolicy = p;

+ return this;

+ }

+ public Parser build() { // creates a Parser from the settings currently held by this builder

+ return new Parser(allowUnknownFields, singularOverwritePolicy);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}.

+ *

+ * <p>No extensions are recognized: the empty extension registry is used.

+ */

+ public void merge(final Readable input,

+ final Message.Builder builder)

+ throws IOException {

+ merge(input, ExtensionRegistry.getEmptyRegistry(), builder);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}.

+ *

+ * <p>No extensions are recognized: the empty extension registry is used.

+ */

+ public void merge(final CharSequence input,

+ final Message.Builder builder)

+ throws ParseException {

+ merge(input, ExtensionRegistry.getEmptyRegistry(), builder);

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}. Extensions will be recognized if they are

+ * registered in {@code extensionRegistry}.

+ *

+ * <p>The whole input is read into memory before any parsing starts.

+ */

+ public void merge(final Readable input,

+ final ExtensionRegistry extensionRegistry,

+ final Message.Builder builder)

+ throws IOException {

+ // Read the entire input to a String then parse that.

+ // If StreamTokenizer were not quite so crippled, or if there were a kind

+ // of Reader that could read in chunks that match some particular regex,

+ // or if we wanted to write a custom Reader to tokenize our stream, then

+ // we would not have to read to one big String. Alas, none of these is

+ // the case. Oh well.

+ merge(toStringBuilder(input), extensionRegistry, builder);

+ }

+ private static final int BUFFER_SIZE = 4096; // capacity, in chars, of the CharBuffer that toStringBuilder reads into

+ // TODO(chrisn): See if working around java.io.Reader#read(CharBuffer)

+ // overhead is worthwhile

+ /**

+ * Reads {@code input} until it reports end of input ({@code -1}) and returns

+ * everything that was read.

+ *

+ * @param input the character source to drain

+ * @return the accumulated characters

+ * @throws IOException if {@code input} fails while reading

+ */

+ private static StringBuilder toStringBuilder(final Readable input)

+ throws IOException {

+ final StringBuilder text = new StringBuilder();

+ final CharBuffer buffer = CharBuffer.allocate(BUFFER_SIZE);

+ while (true) {

+ final int n = input.read(buffer);

+ if (n == -1) {

+ break;

+ }

+ buffer.flip();

+ text.append(buffer, 0, n);

+ // Restore position 0 and the full capacity as limit. Without this the

+ // limit set by flip() stays at n, so every later read is capped at the

+ // size of the previous one, and a single 0-length read would pin the

+ // limit at 0 and make this loop spin forever.

+ buffer.clear();

+ }

+ return text;

+ }

+ /**

+ * Parse a text-format message from {@code input} and merge the contents

+ * into {@code builder}. Extensions will be recognized if they are

+ * registered in {@code extensionRegistry}.

+ *

+ * <p>Fields are merged one at a time until the tokenizer reaches the end of

+ * the input; the first parse error aborts with a {@link ParseException}.

+ */

+ public void merge(final CharSequence input,

+ final ExtensionRegistry extensionRegistry,

+ final Message.Builder builder)

+ throws ParseException {

+ final Tokenizer tokenizer = new Tokenizer(input);

+ MessageReflection.BuilderAdapter target =

+ new MessageReflection.BuilderAdapter(builder); // wraps the builder so fields can be merged through the MergeTarget interface

+ while (!tokenizer.atEnd()) {

+ mergeField(tokenizer, extensionRegistry, target);

+ }

+ /**

+ * Parse a single field from {@code tokenizer} and merge it into

+ * {@code target}.

+ *

+ * <p>A name written in square brackets is resolved as an extension through

+ * {@code extensionRegistry}; any other name is resolved against the message

+ * type of {@code target}. If nothing matches, a parse exception is thrown

+ * unless {@code allowUnknownFields} is set, in which case a warning is

+ * logged and the field's value is skipped. For a known field the value (or

+ * a bracketed, comma-separated list of values for a repeated field) is

+ * handed to {@code consumeFieldValue}, and one optional trailing ";" or ","

+ * is consumed.

+ */

+ private void mergeField(final Tokenizer tokenizer,

+ final ExtensionRegistry extensionRegistry,

+ final MessageReflection.MergeTarget target)

+ throws ParseException {

+ FieldDescriptor field = null; // stays null when the name cannot be resolved

+ final Descriptor type = target.getDescriptorForType();

+ ExtensionRegistry.ExtensionInfo extension = null;

+ if (tokenizer.tryConsume("[")) {

+ // An extension.

+ final StringBuilder name =

+ new StringBuilder(tokenizer.consumeIdentifier());

+ while (tokenizer.tryConsume(".")) {

+ name.append('.');

+ name.append(tokenizer.consumeIdentifier());

+ }

+ extension = target.findExtensionByName(

+ extensionRegistry, name.toString());

+ if (extension == null) {

+ if (!allowUnknownFields) {

+ throw tokenizer.parseExceptionPreviousToken(

+ "Extension \"" + name + "\" not found in the ExtensionRegistry.");

+ } else {

+ logger.warning(

+ "Extension \"" + name + "\" not found in the ExtensionRegistry.");

+ }

+ } else {

+ if (extension.descriptor.getContainingType() != type) {

+ throw tokenizer.parseExceptionPreviousToken(

+ "Extension \"" + name + "\" does not extend message type \""

+ + type.getFullName() + "\".");

+ }

+ field = extension.descriptor;

+ }

+ tokenizer.consume("]");

+ } else {

+ final String name = tokenizer.consumeIdentifier();

+ field = type.findFieldByName(name);

+ // Group names are expected to be capitalized as they appear in the

+ // .proto file, which actually matches their type names, not their field

+ // names.

+ if (field == null) {

+ // Explicitly specify US locale so that this code does not break when

+ // executing in Turkey.

+ final String lowerName = name.toLowerCase(Locale.US);

+ field = type.findFieldByName(lowerName);

+ // If the case-insensitive match worked but the field is NOT a group, discard the match.

+ if (field != null && field.getType() != FieldDescriptor.Type.GROUP) {

+ field = null;

+ }

+ // Again, special-case group names as described above.

+ if (field != null && field.getType() == FieldDescriptor.Type.GROUP

+ && !field.getMessageType().getName().equals(name)) {

+ field = null;

+ }

+ if (field == null) {

+ if (!allowUnknownFields) {

+ throw tokenizer.unknownFieldParseExceptionPreviousToken(

+ name,

+ "Message type \"" + type.getFullName()

+ + "\" has no field named \"" + name + "\".");

+ } else {

+ logger.warning(

+ "Message type \"" + type.getFullName()

+ + "\" has no field named \"" + name + "\".");

+ }

+ // Skips unknown fields.

+ if (field == null) {

+ // Try to guess the type of this field.

+ // If this field is not a message, there should be a ":" between the

+ // field name and the field value and also the field value should not

+ // start with "{" or "<" which indicates the beginning of a message body.

+ // If there is no ":" or there is a "{" or "<" after ":", this field has

+ // to be a message or the input is ill-formed.

+ if (tokenizer.tryConsume(":")

+ && !tokenizer.lookingAt("{")

+ && !tokenizer.lookingAt("<")) {

+ skipFieldValue(tokenizer);

+ } else {

+ skipFieldMessage(tokenizer);

+ }

+ return;

+ }

+ // Handle potential ':'.

+ if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

+ tokenizer.tryConsume(":"); // optional

+ } else {

+ tokenizer.consume(":"); // required

+ }

+ // Support specifying repeated field values as a comma-separated list.

+ // Ex."foo: [1, 2, 3]"

+ if (field.isRepeated() && tokenizer.tryConsume("[")) {

+ while (true) {

+ consumeFieldValue(tokenizer, extensionRegistry, target, field, extension); // a value is read before "]" is tested, so "[]" is not accepted here

+ if (tokenizer.tryConsume("]")) {

+ // End of list.

+ break;

+ }

+ tokenizer.consume(",");

+ }

+ } else {

+ consumeFieldValue(tokenizer, extensionRegistry, target, field, extension);

+ }

+ // For historical reasons, fields may optionally be separated by commas or

+ // semicolons.

+ if (!tokenizer.tryConsume(";")) {

+ tokenizer.tryConsume(",");

+ }

+ /**

+ * Parse a single field value from {@code tokenizer} and merge it into

+ * {@code target}.

+ *

+ * <p>Message-typed values are delimited by "&lt;" "&gt;" or "{" "}" and are

+ * parsed field by field into a sub-target. Other values are read with the

+ * tokenizer method matching the field type; enum values may be written as a

+ * number or as a name. The value is then added to a repeated field, or set

+ * on a singular field unless the overwrite policy forbids replacing a field

+ * or oneof that is already set, in which case a parse exception is thrown.

+ *

+ * @param extension the extension info for {@code field}, or null; when

+ * present its default instance is passed on when the sub-target for a

+ * message value is created

+ */

+ private void consumeFieldValue(

+ final Tokenizer tokenizer,

+ final ExtensionRegistry extensionRegistry,

+ final MessageReflection.MergeTarget target,

+ final FieldDescriptor field,

+ final ExtensionRegistry.ExtensionInfo extension)

+ throws ParseException {

+ Object value = null;

+ if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

+ final String endToken;

+ if (tokenizer.tryConsume("<")) {

+ endToken = ">";

+ } else {

+ tokenizer.consume("{");

+ endToken = "}";

+ }

+ final MessageReflection.MergeTarget subField;

+ subField = target.newMergeTargetForField(field,

+ (extension == null) ? null : extension.defaultInstance);

+ while (!tokenizer.tryConsume(endToken)) {

+ if (tokenizer.atEnd()) {

+ throw tokenizer.parseException(

+ "Expected \"" + endToken + "\".");

+ }

+ mergeField(tokenizer, extensionRegistry, subField);

+ }

+ value = subField.finish();

+ } else {

+ switch (field.getType()) {

+ case INT32:

+ case SINT32:

+ case SFIXED32:

+ value = tokenizer.consumeInt32();

+ break;

+ case INT64:

+ case SINT64:

+ case SFIXED64:

+ value = tokenizer.consumeInt64();

+ break;

+ case UINT32:

+ case FIXED32:

+ value = tokenizer.consumeUInt32();

+ break;

+ case UINT64:

+ case FIXED64:

+ value = tokenizer.consumeUInt64();

+ break;

+ case FLOAT:

+ value = tokenizer.consumeFloat();

+ break;

+ case DOUBLE:

+ value = tokenizer.consumeDouble();

+ break;

+ case BOOL:

+ value = tokenizer.consumeBoolean();

+ break;

+ case STRING:

+ value = tokenizer.consumeString();

+ break;

+ case BYTES:

+ value = tokenizer.consumeByteString();

+ break;

+ case ENUM:

+ final EnumDescriptor enumType = field.getEnumType();

+ if (tokenizer.lookingAtInteger()) {

+ final int number = tokenizer.consumeInt32();

+ value = enumType.findValueByNumber(number);

+ if (value == null) {

+ throw tokenizer.parseExceptionPreviousToken(

+ "Enum type \"" + enumType.getFullName()

+ + "\" has no value with number " + number + '.');

+ }

+ } else {

+ final String id = tokenizer.consumeIdentifier();

+ value = enumType.findValueByName(id);

+ if (value == null) {

+ throw tokenizer.parseExceptionPreviousToken(

+ "Enum type \"" + enumType.getFullName()

+ + "\" has no value named \"" + id + "\".");

+ }

+ break;

+ case MESSAGE:

+ case GROUP:

+ throw new RuntimeException("Can't get here."); // message-typed fields are handled by the branch above the switch

+ }

+ if (field.isRepeated()) {

+ target.addRepeatedField(field, value);

+ } else if ((singularOverwritePolicy

+ == SingularOverwritePolicy.FORBID_SINGULAR_OVERWRITES)

+ && target.hasField(field)) {

+ throw tokenizer.parseExceptionPreviousToken("Non-repeated field \""

+ + field.getFullName() + "\" cannot be overwritten.");

+ } else if ((singularOverwritePolicy

+ == SingularOverwritePolicy.FORBID_SINGULAR_OVERWRITES)

+ && field.getContainingOneof() != null

+ && target.hasOneof(field.getContainingOneof())) {

+ Descriptors.OneofDescriptor oneof = field.getContainingOneof();

+ throw tokenizer.parseExceptionPreviousToken("Field \""

+ + field.getFullName() + "\" is specified along with field \""

+ + target.getOneofFieldDescriptor(oneof).getFullName()

+ + "\", another member of oneof \"" + oneof.getName() + "\".");

+ } else {

+ target.setField(field, value);

+ }

+ /**

+ * Skips the next field including the field's name and value.

+ *

+ * <p>The name may be a plain identifier or a bracketed, dot-separated

+ * extension name. Nothing is looked up or merged; the tokens are only

+ * consumed, together with one optional trailing ";" or ",".

+ */

+ private void skipField(Tokenizer tokenizer) throws ParseException {

+ if (tokenizer.tryConsume("[")) {

+ // Extension name.

+ do {

+ tokenizer.consumeIdentifier();

+ } while (tokenizer.tryConsume("."));

+ tokenizer.consume("]");

+ } else {

+ tokenizer.consumeIdentifier();

+ }

+ // Try to guess the type of this field.

+ // If this field is not a message, there should be a ":" between the

+ // field name and the field value and also the field value should not

+ // start with "{" or "<" which indicates the beginning of a message body.

+ // If there is no ":" or there is a "{" or "<" after ":", this field has

+ // to be a message or the input is ill-formed.

+ if (tokenizer.tryConsume(":")

+ && !tokenizer.lookingAt("<")

+ && !tokenizer.lookingAt("{")) {

+ skipFieldValue(tokenizer);

+ } else {

+ skipFieldMessage(tokenizer);

+ }

+ // For historical reasons, fields may optionally be separated by commas or

+ // semicolons.

+ if (!tokenizer.tryConsume(";")) {

+ tokenizer.tryConsume(",");

+ }

+ /**

+ * Skips the whole body of a message including the beginning delimiter and

+ * the ending delimiter.

+ *

+ * <p>The body must open with "&lt;" or "{" and must close with the matching

+ * delimiter; otherwise a {@link ParseException} is thrown.

+ */

+ private void skipFieldMessage(Tokenizer tokenizer) throws ParseException {

+ final String delimiter;

+ if (tokenizer.tryConsume("<")) {

+ delimiter = ">";

+ } else {

+ tokenizer.consume("{");

+ delimiter = "}";

+ }

+ while (!tokenizer.lookingAt(">") && !tokenizer.lookingAt("}")) { // stops at either closer; the consume below enforces that it is the matching one

+ skipField(tokenizer);

+ }

+ tokenizer.consume(delimiter);

+ }

+ /**

+ * Skips a field value.

+ *

+ * <p>A value is either a run of one or more adjacent string tokens, or a

+ * single identifier or number. Anything else raises a

+ * {@link ParseException} that names the offending token.

+ */

+ private void skipFieldValue(Tokenizer tokenizer) throws ParseException {

+ if (tokenizer.tryConsumeString()) {

+ while (tokenizer.tryConsumeString()) {} // swallow the remaining adjacent string tokens

+ return;

+ }

+ if (!tokenizer.tryConsumeIdentifier() // includes enum & boolean

+ && !tokenizer.tryConsumeInt64() // includes int32

+ && !tokenizer.tryConsumeUInt64() // includes uint32

+ && !tokenizer.tryConsumeDouble()

+ && !tokenizer.tryConsumeFloat()) {

+ throw tokenizer.parseException(

+ "Invalid field value: " + tokenizer.currentToken);

+ }

+ // =================================================================

+ // Utility functions

+ //

+ // Some of these methods are package-private because Descriptors.java uses

+ // them.

+ private interface ByteSequence { // minimal read-only view that lets escapeBytes treat a ByteString and a byte[] alike

+ int size(); // number of bytes in the sequence

+ byte byteAt(int offset); // byte at the given zero-based offset

+ }

+ /**

+ * Escapes bytes in the format used in protocol buffer text format, which

+ * is the same as the format used for C string literals. All bytes

+ * that are not printable 7-bit ASCII characters are escaped, as well as

+ * backslash, single-quote, and double-quote characters. Characters for

+ * which no defined short-hand escape sequence is defined will be escaped

+ * using 3-digit octal sequences.

+ *

+ * @param input the bytes to escape

+ * @return the escaped text, without surrounding quotes

+ */

+ public static String escapeBytes(final ByteSequence input) {

+ final StringBuilder builder = new StringBuilder(input.size());

+ for (int i = 0; i < input.size(); i++) {

+ final byte b = input.byteAt(i);

+ switch (b) {

+ // Java does not recognize \a or \v, apparently.

+ case 0x07: builder.append("\\a"); break;

+ case '\b': builder.append("\\b"); break;

+ case '\f': builder.append("\\f"); break;

+ case '\n': builder.append("\\n"); break;

+ case '\r': builder.append("\\r"); break;

+ case '\t': builder.append("\\t"); break;

+ case 0x0b: builder.append("\\v"); break;

+ case '\\': builder.append("\\\\"); break;

+ case '\'': builder.append("\\\'"); break;

+ case '"' : builder.append("\\\""); break;

+ default:

+ // Only ASCII characters between 0x20 (space) and 0x7e (tilde) are

+ // printable. Other byte values must be escaped.

+ if (b >= 0x20 && b <= 0x7e) {

+ builder.append((char) b);

+ } else {

+ builder.append('\\');

+ builder.append((char) ('0' + ((b >>> 6) & 3))); // the masks keep only the low 8 bits, so negative bytes come out as \200..\377

+ builder.append((char) ('0' + ((b >>> 3) & 7)));

+ builder.append((char) ('0' + (b & 7)));

+ }

+ break;

+ }

+ return builder.toString();

+ }

+ /**

+ * Escapes bytes in the format used in protocol buffer text format, which

+ * is the same as the format used for C string literals. All bytes

+ * that are not printable 7-bit ASCII characters are escaped, as well as

+ * backslash, single-quote, and double-quote characters. Characters for

+ * which no defined short-hand escape sequence is defined will be escaped

+ * using 3-digit octal sequences.

+ *

+ * <p>Wraps {@code input} in an adapter and delegates to the

+ * {@code ByteSequence} overload; the bytes are not copied.

+ */

+ public static String escapeBytes(final ByteString input) {

+ return escapeBytes(new ByteSequence() {

+ @Override

+ public int size() {

+ return input.size();

+ }

+ @Override

+ public byte byteAt(int offset) {

+ return input.byteAt(offset);

+ }

+ });

+ }

+ /**

+ * Like {@link #escapeBytes(ByteString)}, but used for byte array.

+ *

+ * <p>Wraps {@code input} in an adapter and delegates to the

+ * {@code ByteSequence} overload; the array is not copied.

+ */

+ public static String escapeBytes(final byte[] input) {

+ return escapeBytes(new ByteSequence() {

+ @Override

+ public int size() {

+ return input.length;

+ }

+ @Override

+ public byte byteAt(int offset) {

+ return input[offset];

+ }

+ });

+ }

+ /**

+ * Un-escape a byte sequence as escaped using

+ * {@link #escapeBytes(ByteString)}. Two-digit hex escapes (starting with

+ * "\x") are also recognized.

+ *

+ * <p>Octal escapes take one to three digits and hex escapes one or two

+ * digits. The resulting code is stored with a plain cast to {@code byte}.

+ *

+ * @param charString the escaped text, without surrounding quotes

+ * @return the unescaped bytes

+ * @throws InvalidEscapeSequenceException if a backslash is the last

+ * character, is followed by an unsupported character, or introduces a

+ * "\x" escape that has no hex digit

+ */

+ public static ByteString unescapeBytes(final CharSequence charString)

+ throws InvalidEscapeSequenceException {

+ // First convert the Java character sequence to UTF-8 bytes.

+ ByteString input = ByteString.copyFromUtf8(charString.toString());

+ // Then unescape certain byte sequences introduced by ASCII '\\'. The valid

+ // escapes can all be expressed with ASCII characters, so it is safe to

+ // operate on bytes here.

+ //

+ // Unescaping the input byte array will result in a byte sequence that's no

+ // longer than the input. That's because each escape sequence is between

+ // two and four bytes long and stands for a single byte.

+ final byte[] result = new byte[input.size()];

+ int pos = 0;

+ for (int i = 0; i < input.size(); i++) {

+ byte c = input.byteAt(i);

+ if (c == '\\') {

+ if (i + 1 < input.size()) {

+ ++i;

+ c = input.byteAt(i);

+ if (isOctal(c)) {

+ // Octal escape.

+ int code = digitValue(c);

+ if (i + 1 < input.size() && isOctal(input.byteAt(i + 1))) {

+ ++i;

+ code = code * 8 + digitValue(input.byteAt(i));

+ }

+ if (i + 1 < input.size() && isOctal(input.byteAt(i + 1))) {

+ ++i;

+ code = code * 8 + digitValue(input.byteAt(i));

+ }

+ // TODO: Check that 0 <= code && code <= 0xFF. Until then, escapes above \377 are silently truncated by the cast below.

+ result[pos++] = (byte) code;

+ } else {

+ switch (c) {

+ case 'a' : result[pos++] = 0x07; break;

+ case 'b' : result[pos++] = '\b'; break;

+ case 'f' : result[pos++] = '\f'; break;

+ case 'n' : result[pos++] = '\n'; break;

+ case 'r' : result[pos++] = '\r'; break;

+ case 't' : result[pos++] = '\t'; break;

+ case 'v' : result[pos++] = 0x0b; break;

+ case '\\': result[pos++] = '\\'; break;

+ case '\'': result[pos++] = '\''; break;

+ case '"' : result[pos++] = '\"'; break;

+ case 'x':

+ // hex escape

+ int code = 0;

+ if (i + 1 < input.size() && isHex(input.byteAt(i + 1))) {

+ ++i;

+ code = digitValue(input.byteAt(i));

+ } else {

+ throw new InvalidEscapeSequenceException(

+ "Invalid escape sequence: '\\x' with no digits");

+ }

+ if (i + 1 < input.size() && isHex(input.byteAt(i + 1))) { // the second hex digit is optional

+ ++i;

+ code = code * 16 + digitValue(input.byteAt(i));

+ }

+ result[pos++] = (byte) code;

+ break;

+ default:

+ throw new InvalidEscapeSequenceException(

+ "Invalid escape sequence: '\\" + (char) c + '\'');

+ }

+ } else {

+ throw new InvalidEscapeSequenceException(

+ "Invalid escape sequence: '\\' at end of string.");

+ }

+ } else {

+ result[pos++] = c;

+ }

+ return ByteString.copyFrom(result, 0, pos); // only the first pos bytes of result were filled

+ }

+ /**

+ * Thrown by {@link TextFormat#unescapeBytes} and

+ * {@link TextFormat#unescapeText} when an invalid escape sequence is seen.

+ * The constructor is package-private.

+ */

+ public static class InvalidEscapeSequenceException extends IOException {

+ private static final long serialVersionUID = -8164033650142593304L;

+ InvalidEscapeSequenceException(final String description) {

+ super(description);

+ }

+ /**

+ * Like {@link #escapeBytes(ByteString)}, but escapes a text string.

+ * Non-ASCII characters are first encoded as UTF-8, then each byte is escaped

+ * individually as a 3-digit octal escape. Yes, it's weird.

+ *

+ * @param input the text to escape

+ * @return the escaped form of the UTF-8 encoding of {@code input}

+ */

+ static String escapeText(final String input) {

+ return escapeBytes(ByteString.copyFromUtf8(input));

+ }

+ /**

+ * Escape double quotes and backslashes in a String for unicode output of a message.

+ * All other characters, including non-ASCII ones, are left unchanged.

+ */

+ public static String escapeDoubleQuotesAndBackslashes(final String input) {

+ return input.replace("\\", "\\\\").replace("\"", "\\\""); // backslashes first, so those added for the quotes are not doubled

+ }

+ /**

+ * Un-escape a text string as escaped using {@link #escapeText(String)}.

+ * Two-digit hex escapes (starting with "\x") are also recognized.

+ *

+ * <p>The unescaped bytes are decoded as UTF-8.

+ */

+ static String unescapeText(final String input)

+ throws InvalidEscapeSequenceException {

+ return unescapeBytes(input).toStringUtf8();

+ }

+ /** Is this an octal digit, i.e. an ASCII character from '0' to '7'? */

+ private static boolean isOctal(final byte c) {

+ return '0' <= c && c <= '7';

+ }

+ /** Is this a hex digit, i.e. an ASCII '0'-'9', 'a'-'f' or 'A'-'F'? */

+ private static boolean isHex(final byte c) {

+ return ('0' <= c && c <= '9')

+ || ('a' <= c && c <= 'f')

+ || ('A' <= c && c <= 'F');

+ }

+ /**

+ * Interpret a character as a digit (in any base up to 36) and return the

+ * numeric value. This is like {@code Character.digit()} but we don't accept

+ * non-ASCII digits.

+ *

+ * <p>No validation is performed: every byte outside '0'-'9' and 'a'-'z' is

+ * treated as an upper-case letter, so callers must check the input first.

+ */

+ private static int digitValue(final byte c) {

+ if ('0' <= c && c <= '9') {

+ return c - '0';

+ } else if ('a' <= c && c <= 'z') {

+ return c - 'a' + 10;

+ } else {

+ return c - 'A' + 10; // unchecked fall-through: only meaningful for 'A'-'Z'

+ }

+ /**

+ * Parse a 32-bit signed integer from the text. Unlike the Java standard

+ * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

+ * and "0" to signify hexadecimal and octal numbers, respectively.

+ *

+ * @throws NumberFormatException if the text is not a valid number or is out

+ * of range for a 32-bit signed integer

+ */

+ static int parseInt32(final String text) throws NumberFormatException {

+ return (int) parseInteger(text, true, false);

+ }

+ /**

+ * Parse a 32-bit unsigned integer from the text. Unlike the Java standard

+ * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

+ * and "0" to signify hexadecimal and octal numbers, respectively. The

+ * result is coerced to a (signed) {@code int} when returned since Java has

+ * no unsigned integer type.

+ *

+ * @throws NumberFormatException if the text starts with "-", is not a valid

+ * number, or is out of range for a 32-bit unsigned integer

+ */

+ static int parseUInt32(final String text) throws NumberFormatException {

+ return (int) parseInteger(text, false, false);

+ }

+ /**

+ * Parse a 64-bit signed integer from the text. Unlike the Java standard

+ * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

+ * and "0" to signify hexadecimal and octal numbers, respectively.

+ *

+ * @throws NumberFormatException if the text is not a valid number or is out

+ * of range for a 64-bit signed integer

+ */

+ static long parseInt64(final String text) throws NumberFormatException {

+ return parseInteger(text, true, true);

+ }

+ /**

+ * Parse a 64-bit unsigned integer from the text. Unlike the Java standard

+ * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

+ * and "0" to signify hexadecimal and octal numbers, respectively. The

+ * result is coerced to a (signed) {@code long} when returned since Java has

+ * no unsigned long type.

+ *

+ * @throws NumberFormatException if the text starts with "-", is not a valid

+ * number, or is out of range for a 64-bit unsigned integer

+ */

+ static long parseUInt64(final String text) throws NumberFormatException {

+ return parseInteger(text, false, true);

+ }

+ private static long parseInteger(final String text, // shared implementation behind parseInt32/parseUInt32/parseInt64/parseUInt64

+ final boolean isSigned, // false: a leading "-" is rejected

+ final boolean isLong) // true: 64-bit range, false: 32-bit range

+ throws NumberFormatException {

+ int pos = 0;

+ boolean negative = false;

+ if (text.startsWith("-", pos)) {

+ if (!isSigned) {

+ throw new NumberFormatException("Number must be positive: " + text);

+ }

+ ++pos;

+ negative = true;

+ }

+ int radix = 10;

+ if (text.startsWith("0x", pos)) { // only the lower-case "0x" prefix is recognized

+ pos += 2;

+ radix = 16;

+ } else if (text.startsWith("0", pos)) { // the leading "0" is not skipped; it is parsed along with the octal digits

+ radix = 8;

+ }

+ final String numberText = text.substring(pos);

+ long result = 0;

+ if (numberText.length() < 16) {

+ // Can safely assume no overflow.

+ result = Long.parseLong(numberText, radix);

+ if (negative) {

+ result = -result;

+ }

+ // Check bounds.

+ // No need to check for 64-bit numbers since they'd have to be 16 chars

+ // or longer to overflow.

+ if (!isLong) {

+ if (isSigned) {

+ if (result > Integer.MAX_VALUE || result < Integer.MIN_VALUE) {

+ throw new NumberFormatException(

+ "Number out of range for 32-bit signed integer: " + text);

+ }

+ } else {

+ if (result >= (1L << 32) || result < 0) {

+ throw new NumberFormatException(

+ "Number out of range for 32-bit unsigned integer: " + text);

+ }

+ } else {

+ BigInteger bigValue = new BigInteger(numberText, radix); // 16 or more digits may not fit in a long, so parse without a size limit

+ if (negative) {

+ bigValue = bigValue.negate();

+ }

+ // Check bounds.

+ if (!isLong) {

+ if (isSigned) {

+ if (bigValue.bitLength() > 31) { // bitLength() excludes the sign bit

+ throw new NumberFormatException(

+ "Number out of range for 32-bit signed integer: " + text);

+ }

+ } else {

+ if (bigValue.bitLength() > 32) {

+ throw new NumberFormatException(

+ "Number out of range for 32-bit unsigned integer: " + text);

+ }

+ } else {

+ if (isSigned) {

+ if (bigValue.bitLength() > 63) {

+ throw new NumberFormatException(

+ "Number out of range for 64-bit signed integer: " + text);

+ }

+ } else {

+ if (bigValue.bitLength() > 64) {

+ throw new NumberFormatException(

+ "Number out of range for 64-bit unsigned integer: " + text);

+ }

+ result = bigValue.longValue(); // unsigned 64-bit values above Long.MAX_VALUE wrap to negative longs here

+ }

+ return result;

+ }