third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java - Issue 556933002: Remove protobuf lite for java.

Unified Diff: third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

Issue 556933002: Remove protobuf lite for java. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Rebase before submit Created 6 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « third_party/protobuf/java/src/main/java/com/google/protobuf/SmallSortedMap.java ('k') | third_party/protobuf/java/src/main/java/com/google/protobuf/UninitializedMessageException.java » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

diff --git a/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java b/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

deleted file mode 100644

index ed4628994f904699ecada4c9318997d9783be514..0000000000000000000000000000000000000000

--- a/third_party/protobuf/java/src/main/java/com/google/protobuf/TextFormat.java

+++ /dev/null

@@ -1,1559 +0,0 @@

-// Protocol Buffers - Google's data interchange format

-// http://code.google.com/p/protobuf/

-//

-// Redistribution and use in source and binary forms, with or without

-// modification, are permitted provided that the following conditions are

-// met:

-//

-// * Redistributions of source code must retain the above copyright

-// notice, this list of conditions and the following disclaimer.

-// * Redistributions in binary form must reproduce the above

-// copyright notice, this list of conditions and the following disclaimer

-// in the documentation and/or other materials provided with the

-// distribution.

-// * Neither the name of Google Inc. nor the names of its

-// contributors may be used to endorse or promote products derived from

-// this software without specific prior written permission.

-//

-// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

-// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

-// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

-// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

-// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

-// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

-// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

-// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

-// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

-// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

-// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

-package com.google.protobuf;

-import com.google.protobuf.Descriptors.Descriptor;

-import com.google.protobuf.Descriptors.FieldDescriptor;

-import com.google.protobuf.Descriptors.EnumDescriptor;

-import com.google.protobuf.Descriptors.EnumValueDescriptor;

-import java.io.IOException;

-import java.nio.CharBuffer;

-import java.math.BigInteger;

-import java.util.ArrayList;

-import java.util.List;

-import java.util.Locale;

-import java.util.Map;

-import java.util.regex.Matcher;

-import java.util.regex.Pattern;

-/**

- * Provide text parsing and formatting support for proto2 instances.

- * The implementation largely follows google/protobuf/text_format.cc.

- *

- * @author wenboz@google.com Wenbo Zhu

- * @author kenton@google.com Kenton Varda

- */

-public final class TextFormat {

- private TextFormat() {}

- private static final Printer DEFAULT_PRINTER = new Printer();

- private static final Printer SINGLE_LINE_PRINTER =

- (new Printer()).setSingleLineMode(true);

- private static final Printer UNICODE_PRINTER =

- (new Printer()).setEscapeNonAscii(false);

- /**

- * Outputs a textual representation of the Protocol Message supplied into

- * the parameter output. (This representation is the new version of the

- * classic "ProtocolPrinter" output from the original Protocol Buffer system)

- */

- public static void print(final MessageOrBuilder message, final Appendable output)

- throws IOException {

- DEFAULT_PRINTER.print(message, new TextGenerator(output));

- }

- /** Outputs a textual representation of {@code fields} to {@code output}. */

- public static void print(final UnknownFieldSet fields,

- final Appendable output)

- throws IOException {

- DEFAULT_PRINTER.printUnknownFields(fields, new TextGenerator(output));

- }

- /**

- * Generates a human readable form of this message, useful for debugging and

- * other purposes, with no newline characters.

- */

- public static String shortDebugString(final MessageOrBuilder message) {

- try {

- final StringBuilder sb = new StringBuilder();

- SINGLE_LINE_PRINTER.print(message, new TextGenerator(sb));

- // Single line mode currently might have an extra space at the end.

- return sb.toString().trim();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Generates a human readable form of the unknown fields, useful for debugging

- * and other purposes, with no newline characters.

- */

- public static String shortDebugString(final UnknownFieldSet fields) {

- try {

- final StringBuilder sb = new StringBuilder();

- SINGLE_LINE_PRINTER.printUnknownFields(fields, new TextGenerator(sb));

- // Single line mode currently might have an extra space at the end.

- return sb.toString().trim();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Like {@code print()}, but writes directly to a {@code String} and

- * returns it.

- */

- public static String printToString(final MessageOrBuilder message) {

- try {

- final StringBuilder text = new StringBuilder();

- print(message, text);

- return text.toString();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Like {@code print()}, but writes directly to a {@code String} and

- * returns it.

- */

- public static String printToString(final UnknownFieldSet fields) {

- try {

- final StringBuilder text = new StringBuilder();

- print(fields, text);

- return text.toString();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Same as {@code printToString()}, except that non-ASCII characters

- * in string type fields are not escaped in backslash+octals.

- */

- public static String printToUnicodeString(final MessageOrBuilder message) {

- try {

- final StringBuilder text = new StringBuilder();

- UNICODE_PRINTER.print(message, new TextGenerator(text));

- return text.toString();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Same as {@code printToString()}, except that non-ASCII characters

- * in string type fields are not escaped in backslash+octals.

- */

- public static String printToUnicodeString(final UnknownFieldSet fields) {

- try {

- final StringBuilder text = new StringBuilder();

- UNICODE_PRINTER.printUnknownFields(fields, new TextGenerator(text));

- return text.toString();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- public static void printField(final FieldDescriptor field,

- final Object value,

- final Appendable output)

- throws IOException {

- DEFAULT_PRINTER.printField(field, value, new TextGenerator(output));

- }

- public static String printFieldToString(final FieldDescriptor field,

- final Object value) {

- try {

- final StringBuilder text = new StringBuilder();

- printField(field, value, text);

- return text.toString();

- } catch (IOException e) {

- throw new IllegalStateException(e);

- }

- /**

- * Outputs a textual representation of the value of given field value.

- *

- * @param field the descriptor of the field

- * @param value the value of the field

- * @param output the output to which to append the formatted value

- * @throws ClassCastException if the value is not appropriate for the

- * given field descriptor

- * @throws IOException if there is an exception writing to the output

- */

- public static void printFieldValue(final FieldDescriptor field,

- final Object value,

- final Appendable output)

- throws IOException {

- DEFAULT_PRINTER.printFieldValue(field, value, new TextGenerator(output));

- }

- /**

- * Outputs a textual representation of the value of an unknown field.

- *

- * @param tag the field's tag number

- * @param value the value of the field

- * @param output the output to which to append the formatted value

- * @throws ClassCastException if the value is not appropriate for the

- * given field descriptor

- * @throws IOException if there is an exception writing to the output

- */

- public static void printUnknownFieldValue(final int tag,

- final Object value,

- final Appendable output)

- throws IOException {

- printUnknownFieldValue(tag, value, new TextGenerator(output));

- }

- private static void printUnknownFieldValue(final int tag,

- final Object value,

- final TextGenerator generator)

- throws IOException {

- switch (WireFormat.getTagWireType(tag)) {

- case WireFormat.WIRETYPE_VARINT:

- generator.print(unsignedToString((Long) value));

- break;

- case WireFormat.WIRETYPE_FIXED32:

- generator.print(

- String.format((Locale) null, "0x%08x", (Integer) value));

- break;

- case WireFormat.WIRETYPE_FIXED64:

- generator.print(String.format((Locale) null, "0x%016x", (Long) value));

- break;

- case WireFormat.WIRETYPE_LENGTH_DELIMITED:

- generator.print("\"");

- generator.print(escapeBytes((ByteString) value));

- generator.print("\"");

- break;

- case WireFormat.WIRETYPE_START_GROUP:

- DEFAULT_PRINTER.printUnknownFields((UnknownFieldSet) value, generator);

- break;

- default:

- throw new IllegalArgumentException("Bad tag: " + tag);

- }

- /** Helper class for converting protobufs to text. */

- private static final class Printer {

- /** Whether to omit newlines from the output. */

- boolean singleLineMode = false;

- /** Whether to escape non ASCII characters with backslash and octal. */

- boolean escapeNonAscii = true;

- private Printer() {}

- /** Setter of singleLineMode */

- private Printer setSingleLineMode(boolean singleLineMode) {

- this.singleLineMode = singleLineMode;

- return this;

- }

- /** Setter of escapeNonAscii */

- private Printer setEscapeNonAscii(boolean escapeNonAscii) {

- this.escapeNonAscii = escapeNonAscii;

- return this;

- }

- private void print(final MessageOrBuilder message, final TextGenerator generator)

- throws IOException {

- for (Map.Entry<FieldDescriptor, Object> field

- : message.getAllFields().entrySet()) {

- printField(field.getKey(), field.getValue(), generator);

- }

- printUnknownFields(message.getUnknownFields(), generator);

- }

- private void printField(final FieldDescriptor field, final Object value,

- final TextGenerator generator) throws IOException {

- if (field.isRepeated()) {

- // Repeated field. Print each element.

- for (Object element : (List<?>) value) {

- printSingleField(field, element, generator);

- }

- } else {

- printSingleField(field, value, generator);

- }

- private void printSingleField(final FieldDescriptor field,

- final Object value,

- final TextGenerator generator)

- throws IOException {

- if (field.isExtension()) {

- generator.print("[");

- // We special-case MessageSet elements for compatibility with proto1.

- if (field.getContainingType().getOptions().getMessageSetWireFormat()

- && (field.getType() == FieldDescriptor.Type.MESSAGE)

- && (field.isOptional())

- // object equality

- && (field.getExtensionScope() == field.getMessageType())) {

- generator.print(field.getMessageType().getFullName());

- } else {

- generator.print(field.getFullName());

- }

- generator.print("]");

- } else {

- if (field.getType() == FieldDescriptor.Type.GROUP) {

- // Groups must be serialized with their original capitalization.

- generator.print(field.getMessageType().getName());

- } else {

- generator.print(field.getName());

- }

- if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

- if (singleLineMode) {

- generator.print(" { ");

- } else {

- generator.print(" {\n");

- generator.indent();

- }

- } else {

- generator.print(": ");

- }

- printFieldValue(field, value, generator);

- if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

- if (singleLineMode) {

- generator.print("} ");

- } else {

- generator.outdent();

- generator.print("}\n");

- }

- } else {

- if (singleLineMode) {

- generator.print(" ");

- } else {

- generator.print("\n");

- }

- private void printFieldValue(final FieldDescriptor field,

- final Object value,

- final TextGenerator generator)

- throws IOException {

- switch (field.getType()) {

- case INT32:

- case SINT32:

- case SFIXED32:

- generator.print(((Integer) value).toString());

- break;

- case INT64:

- case SINT64:

- case SFIXED64:

- generator.print(((Long) value).toString());

- break;

- case BOOL:

- generator.print(((Boolean) value).toString());

- break;

- case FLOAT:

- generator.print(((Float) value).toString());

- break;

- case DOUBLE:

- generator.print(((Double) value).toString());

- break;

- case UINT32:

- case FIXED32:

- generator.print(unsignedToString((Integer) value));

- break;

- case UINT64:

- case FIXED64:

- generator.print(unsignedToString((Long) value));

- break;

- case STRING:

- generator.print("\"");

- generator.print(escapeNonAscii ?

- escapeText((String) value) :

- (String) value);

- generator.print("\"");

- break;

- case BYTES:

- generator.print("\"");

- generator.print(escapeBytes((ByteString) value));

- generator.print("\"");

- break;

- case ENUM:

- generator.print(((EnumValueDescriptor) value).getName());

- break;

- case MESSAGE:

- case GROUP:

- print((Message) value, generator);

- break;

- }

- private void printUnknownFields(final UnknownFieldSet unknownFields,

- final TextGenerator generator)

- throws IOException {

- for (Map.Entry<Integer, UnknownFieldSet.Field> entry :

- unknownFields.asMap().entrySet()) {

- final int number = entry.getKey();

- final UnknownFieldSet.Field field = entry.getValue();

- printUnknownField(number, WireFormat.WIRETYPE_VARINT,

- field.getVarintList(), generator);

- printUnknownField(number, WireFormat.WIRETYPE_FIXED32,

- field.getFixed32List(), generator);

- printUnknownField(number, WireFormat.WIRETYPE_FIXED64,

- field.getFixed64List(), generator);

- printUnknownField(number, WireFormat.WIRETYPE_LENGTH_DELIMITED,

- field.getLengthDelimitedList(), generator);

- for (final UnknownFieldSet value : field.getGroupList()) {

- generator.print(entry.getKey().toString());

- if (singleLineMode) {

- generator.print(" { ");

- } else {

- generator.print(" {\n");

- generator.indent();

- }

- printUnknownFields(value, generator);

- if (singleLineMode) {

- generator.print("} ");

- } else {

- generator.outdent();

- generator.print("}\n");

- }

- private void printUnknownField(final int number,

- final int wireType,

- final List<?> values,

- final TextGenerator generator)

- throws IOException {

- for (final Object value : values) {

- generator.print(String.valueOf(number));

- generator.print(": ");

- printUnknownFieldValue(wireType, value, generator);

- generator.print(singleLineMode ? " " : "\n");

- }

- /** Convert an unsigned 32-bit integer to a string. */

- private static String unsignedToString(final int value) {

- if (value >= 0) {

- return Integer.toString(value);

- } else {

- return Long.toString(((long) value) & 0x00000000FFFFFFFFL);

- }

- /** Convert an unsigned 64-bit integer to a string. */

- private static String unsignedToString(final long value) {

- if (value >= 0) {

- return Long.toString(value);

- } else {

- // Pull off the most-significant bit so that BigInteger doesn't think

- // the number is negative, then set it again using setBit().

- return BigInteger.valueOf(value & 0x7FFFFFFFFFFFFFFFL)

- .setBit(63).toString();

- }

- /**

- * An inner class for writing text to the output stream.

- */

- private static final class TextGenerator {

- private final Appendable output;

- private final StringBuilder indent = new StringBuilder();

- private boolean atStartOfLine = true;

- private TextGenerator(final Appendable output) {

- this.output = output;

- }

- /**

- * Indent text by two spaces. After calling Indent(), two spaces will be

- * inserted at the beginning of each line of text. Indent() may be called

- * multiple times to produce deeper indents.

- */

- public void indent() {

- indent.append(" ");

- }

- /**

- * Reduces the current indent level by two spaces, or crashes if the indent

- * level is zero.

- */

- public void outdent() {

- final int length = indent.length();

- if (length == 0) {

- throw new IllegalArgumentException(

- " Outdent() without matching Indent().");

- }

- indent.delete(length - 2, length);

- }

- /**

- * Print text to the output stream.

- */

- public void print(final CharSequence text) throws IOException {

- final int size = text.length();

- int pos = 0;

- for (int i = 0; i < size; i++) {

- if (text.charAt(i) == '\n') {

- write(text.subSequence(pos, size), i - pos + 1);

- pos = i + 1;

- atStartOfLine = true;

- }

- write(text.subSequence(pos, size), size - pos);

- }

- private void write(final CharSequence data, final int size)

- throws IOException {

- if (size == 0) {

- return;

- }

- if (atStartOfLine) {

- atStartOfLine = false;

- output.append(indent);

- }

- output.append(data);

- }

- // =================================================================

- // Parsing

- /**

- * Represents a stream of tokens parsed from a {@code String}.

- *

- * <p>The Java standard library provides many classes that you might think

- * would be useful for implementing this, but aren't. For example:

- *

- * <ul>

- * <li>{@code java.io.StreamTokenizer}: This almost does what we want -- or,

- * at least, something that would get us close to what we want -- except

- * for one fatal flaw: It automatically un-escapes strings using Java

- * escape sequences, which do not include all the escape sequences we

- * need to support (e.g. '\x').

- * <li>{@code java.util.Scanner}: This seems like a great way at least to

- * parse regular expressions out of a stream (so we wouldn't have to load

- * the entire input into a single string before parsing). Sadly,

- * {@code Scanner} requires that tokens be delimited with some delimiter.

- * Thus, although the text "foo:" should parse to two tokens ("foo" and

- * ":"), {@code Scanner} would recognize it only as a single token.

- * Furthermore, {@code Scanner} provides no way to inspect the contents

- * of delimiters, making it impossible to keep track of line and column

- * numbers.

- * </ul>

- *

- * <p>Luckily, Java's regular expression support does manage to be useful to

- * us. (Barely: We need {@code Matcher.usePattern()}, which is new in

- * Java 1.5.) So, we can use that, at least. Unfortunately, this implies

- * that we need to have the entire input in one contiguous string.

- */

- private static final class Tokenizer {

- private final CharSequence text;

- private final Matcher matcher;

- private String currentToken;

- // The character index within this.text at which the current token begins.

- private int pos = 0;

- // The line and column numbers of the current token.

- private int line = 0;

- private int column = 0;

- // The line and column numbers of the previous token (allows throwing

- // errors *after* consuming).

- private int previousLine = 0;

- private int previousColumn = 0;

- // We use possessive quantifiers (*+ and ++) because otherwise the Java

- // regex matcher has stack overflows on large inputs.

- private static final Pattern WHITESPACE =

- Pattern.compile("(\\s|(#.*$))++", Pattern.MULTILINE);

- private static final Pattern TOKEN = Pattern.compile(

- "[a-zA-Z_][0-9a-zA-Z_+-]*+|" + // an identifier

- "[.]?[0-9+-][0-9a-zA-Z_.+-]*+|" + // a number

- "\"([^\"\n\\\\]|\\\\.)*+(\"|\\\\?$)|" + // a double-quoted string

- "\'([^\'\n\\\\]|\\\\.)*+(\'|\\\\?$)", // a single-quoted string

- Pattern.MULTILINE);

- private static final Pattern DOUBLE_INFINITY = Pattern.compile(

- "-?inf(inity)?",

- Pattern.CASE_INSENSITIVE);

- private static final Pattern FLOAT_INFINITY = Pattern.compile(

- "-?inf(inity)?f?",

- Pattern.CASE_INSENSITIVE);

- private static final Pattern FLOAT_NAN = Pattern.compile(

- "nanf?",

- Pattern.CASE_INSENSITIVE);

- /** Construct a tokenizer that parses tokens from the given text. */

- private Tokenizer(final CharSequence text) {

- this.text = text;

- this.matcher = WHITESPACE.matcher(text);

- skipWhitespace();

- nextToken();

- }

- /** Are we at the end of the input? */

- public boolean atEnd() {

- return currentToken.length() == 0;

- }

- /** Advance to the next token. */

- public void nextToken() {

- previousLine = line;

- previousColumn = column;

- // Advance the line counter to the current position.

- while (pos < matcher.regionStart()) {

- if (text.charAt(pos) == '\n') {

- ++line;

- column = 0;

- } else {

- ++column;

- }

- ++pos;

- }

- // Match the next token.

- if (matcher.regionStart() == matcher.regionEnd()) {

- // EOF

- currentToken = "";

- } else {

- matcher.usePattern(TOKEN);

- if (matcher.lookingAt()) {

- currentToken = matcher.group();

- matcher.region(matcher.end(), matcher.regionEnd());

- } else {

- // Take one character.

- currentToken = String.valueOf(text.charAt(pos));

- matcher.region(pos + 1, matcher.regionEnd());

- }

- skipWhitespace();

- }

- /**

- * Skip over any whitespace so that the matcher region starts at the next

- * token.

- */

- private void skipWhitespace() {

- matcher.usePattern(WHITESPACE);

- if (matcher.lookingAt()) {

- matcher.region(matcher.end(), matcher.regionEnd());

- }

- /**

- * If the next token exactly matches {@code token}, consume it and return

- * {@code true}. Otherwise, return {@code false} without doing anything.

- */

- public boolean tryConsume(final String token) {

- if (currentToken.equals(token)) {

- nextToken();

- return true;

- } else {

- return false;

- }

- /**

- * If the next token exactly matches {@code token}, consume it. Otherwise,

- * throw a {@link ParseException}.

- */

- public void consume(final String token) throws ParseException {

- if (!tryConsume(token)) {

- throw parseException("Expected \"" + token + "\".");

- }

- /**

- * Returns {@code true} if the next token is an integer, but does

- * not consume it.

- */

- public boolean lookingAtInteger() {

- if (currentToken.length() == 0) {

- return false;

- }

- final char c = currentToken.charAt(0);

- return ('0' <= c && c <= '9') ||

- c == '-' || c == '+';

- }

- /**

- * If the next token is an identifier, consume it and return its value.

- * Otherwise, throw a {@link ParseException}.

- */

- public String consumeIdentifier() throws ParseException {

- for (int i = 0; i < currentToken.length(); i++) {

- final char c = currentToken.charAt(i);

- if (('a' <= c && c <= 'z') ||

- ('A' <= c && c <= 'Z') ||

- ('0' <= c && c <= '9') ||

- (c == '_') || (c == '.')) {

- // OK

- } else {

- throw parseException("Expected identifier.");

- }

- final String result = currentToken;

- nextToken();

- return result;

- }

- /**

- * If the next token is a 32-bit signed integer, consume it and return its

- * value. Otherwise, throw a {@link ParseException}.

- */

- public int consumeInt32() throws ParseException {

- try {

- final int result = parseInt32(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw integerParseException(e);

- }

- /**

- * If the next token is a 32-bit unsigned integer, consume it and return its

- * value. Otherwise, throw a {@link ParseException}.

- */

- public int consumeUInt32() throws ParseException {

- try {

- final int result = parseUInt32(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw integerParseException(e);

- }

- /**

- * If the next token is a 64-bit signed integer, consume it and return its

- * value. Otherwise, throw a {@link ParseException}.

- */

- public long consumeInt64() throws ParseException {

- try {

- final long result = parseInt64(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw integerParseException(e);

- }

- /**

- * If the next token is a 64-bit unsigned integer, consume it and return its

- * value. Otherwise, throw a {@link ParseException}.

- */

- public long consumeUInt64() throws ParseException {

- try {

- final long result = parseUInt64(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw integerParseException(e);

- }

- /**

- * If the next token is a double, consume it and return its value.

- * Otherwise, throw a {@link ParseException}.

- */

- public double consumeDouble() throws ParseException {

- // We need to parse infinity and nan separately because

- // Double.parseDouble() does not accept "inf", "infinity", or "nan".

- if (DOUBLE_INFINITY.matcher(currentToken).matches()) {

- final boolean negative = currentToken.startsWith("-");

- nextToken();

- return negative ? Double.NEGATIVE_INFINITY : Double.POSITIVE_INFINITY;

- }

- if (currentToken.equalsIgnoreCase("nan")) {

- nextToken();

- return Double.NaN;

- }

- try {

- final double result = Double.parseDouble(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw floatParseException(e);

- }

- /**

- * If the next token is a float, consume it and return its value.

- * Otherwise, throw a {@link ParseException}.

- */

- public float consumeFloat() throws ParseException {

- // We need to parse infinity and nan separately because

- // Float.parseFloat() does not accept "inf", "infinity", or "nan".

- if (FLOAT_INFINITY.matcher(currentToken).matches()) {

- final boolean negative = currentToken.startsWith("-");

- nextToken();

- return negative ? Float.NEGATIVE_INFINITY : Float.POSITIVE_INFINITY;

- }

- if (FLOAT_NAN.matcher(currentToken).matches()) {

- nextToken();

- return Float.NaN;

- }

- try {

- final float result = Float.parseFloat(currentToken);

- nextToken();

- return result;

- } catch (NumberFormatException e) {

- throw floatParseException(e);

- }

- /**

- * If the next token is a boolean, consume it and return its value.

- * Otherwise, throw a {@link ParseException}.

- */

- public boolean consumeBoolean() throws ParseException {

- if (currentToken.equals("true") ||

- currentToken.equals("t") ||

- currentToken.equals("1")) {

- nextToken();

- return true;

- } else if (currentToken.equals("false") ||

- currentToken.equals("f") ||

- currentToken.equals("0")) {

- nextToken();

- return false;

- } else {

- throw parseException("Expected \"true\" or \"false\".");

- }

- /**

- * If the next token is a string, consume it and return its (unescaped)

- * value. Otherwise, throw a {@link ParseException}.

- */

- public String consumeString() throws ParseException {

- return consumeByteString().toStringUtf8();

- }

- /**

- * If the next token is a string, consume it, unescape it as a

- * {@link ByteString}, and return it. Otherwise, throw a

- * {@link ParseException}.

- */

- public ByteString consumeByteString() throws ParseException {

- List<ByteString> list = new ArrayList<ByteString>();

- consumeByteString(list);

- while (currentToken.startsWith("'") || currentToken.startsWith("\"")) {

- consumeByteString(list);

- }

- return ByteString.copyFrom(list);

- }

- /**

- * Like {@link #consumeByteString()} but adds each token of the string to

- * the given list. String literals (whether bytes or text) may come in

- * multiple adjacent tokens which are automatically concatenated, like in

- * C or Python.

- */

- private void consumeByteString(List<ByteString> list) throws ParseException {

- final char quote = currentToken.length() > 0 ? currentToken.charAt(0)

- : '\0';

- if (quote != '\"' && quote != '\'') {

- throw parseException("Expected string.");

- }

- if (currentToken.length() < 2 ||

- currentToken.charAt(currentToken.length() - 1) != quote) {

- throw parseException("String missing ending quote.");

- }

- try {

- final String escaped =

- currentToken.substring(1, currentToken.length() - 1);

- final ByteString result = unescapeBytes(escaped);

- nextToken();

- list.add(result);

- } catch (InvalidEscapeSequenceException e) {

- throw parseException(e.getMessage());

- }

- /**

- * Returns a {@link ParseException} with the current line and column

- * numbers in the description, suitable for throwing.

- */

- public ParseException parseException(final String description) {

- // Note: People generally prefer one-based line and column numbers.

- return new ParseException(

- line + 1, column + 1, description);

- }

- /**

- * Returns a {@link ParseException} with the line and column numbers of

- * the previous token in the description, suitable for throwing.

- */

- public ParseException parseExceptionPreviousToken(

- final String description) {

- // Note: People generally prefer one-based line and column numbers.

- return new ParseException(

- previousLine + 1, previousColumn + 1, description);

- }

- /**

- * Constructs an appropriate {@link ParseException} for the given

- * {@code NumberFormatException} when trying to parse an integer.

- */

- private ParseException integerParseException(

- final NumberFormatException e) {

- return parseException("Couldn't parse integer: " + e.getMessage());

- }

- /**

- * Constructs an appropriate {@link ParseException} for the given

- * {@code NumberFormatException} when trying to parse a float or double.

- */

- private ParseException floatParseException(final NumberFormatException e) {

- return parseException("Couldn't parse number: " + e.getMessage());

- }

- /** Thrown when parsing an invalid text format message. */

- public static class ParseException extends IOException {

- private static final long serialVersionUID = 3196188060225107702L;

- private final int line;

- private final int column;

- /** Create a new instance, with -1 as the line and column numbers. */

- public ParseException(final String message) {

- this(-1, -1, message);

- }

- /**

- * Create a new instance

- *

- * @param line the line number where the parse error occurred,

- * using 1-offset.

- * @param column the column number where the parser error occurred,

- * using 1-offset.

- */

- public ParseException(final int line, final int column,

- final String message) {

- super(Integer.toString(line) + ":" + column + ": " + message);

- this.line = line;

- this.column = column;

- }

- /**

- * Return the line where the parse exception occurred, or -1 when

- * none is provided. The value is specified as 1-offset, so the first

- * line is line 1.

- */

- public int getLine() {

- return line;

- }

- /**

- * Return the column where the parse exception occurred, or -1 when

- * none is provided. The value is specified as 1-offset, so the first

- * line is line 1.

- */

- public int getColumn() {

- return column;

- }

- /**

- * Parse a text-format message from {@code input} and merge the contents

- * into {@code builder}.

- */

- public static void merge(final Readable input,

- final Message.Builder builder)

- throws IOException {

- merge(input, ExtensionRegistry.getEmptyRegistry(), builder);

- }

- /**

- * Parse a text-format message from {@code input} and merge the contents

- * into {@code builder}.

- */

- public static void merge(final CharSequence input,

- final Message.Builder builder)

- throws ParseException {

- merge(input, ExtensionRegistry.getEmptyRegistry(), builder);

- }

- /**

- * Parse a text-format message from {@code input} and merge the contents

- * into {@code builder}. Extensions will be recognized if they are

- * registered in {@code extensionRegistry}.

- */

- public static void merge(final Readable input,

- final ExtensionRegistry extensionRegistry,

- final Message.Builder builder)

- throws IOException {

- // Read the entire input to a String then parse that.

- // If StreamTokenizer were not quite so crippled, or if there were a kind

- // of Reader that could read in chunks that match some particular regex,

- // or if we wanted to write a custom Reader to tokenize our stream, then

- // we would not have to read to one big String. Alas, none of these is

- // the case. Oh well.

- merge(toStringBuilder(input), extensionRegistry, builder);

- }

- private static final int BUFFER_SIZE = 4096;

- // TODO(chrisn): See if working around java.io.Reader#read(CharBuffer)

- // overhead is worthwhile

- private static StringBuilder toStringBuilder(final Readable input)

- throws IOException {

- final StringBuilder text = new StringBuilder();

- final CharBuffer buffer = CharBuffer.allocate(BUFFER_SIZE);

- while (true) {

- final int n = input.read(buffer);

- if (n == -1) {

- break;

- }

- buffer.flip();

- text.append(buffer, 0, n);

- }

- return text;

- }

- /**

- * Parse a text-format message from {@code input} and merge the contents

- * into {@code builder}. Extensions will be recognized if they are

- * registered in {@code extensionRegistry}.

- */

- public static void merge(final CharSequence input,

- final ExtensionRegistry extensionRegistry,

- final Message.Builder builder)

- throws ParseException {

- final Tokenizer tokenizer = new Tokenizer(input);

- while (!tokenizer.atEnd()) {

- mergeField(tokenizer, extensionRegistry, builder);

- }

- /**

- * Parse a single field from {@code tokenizer} and merge it into

- * {@code builder}.

- */

- private static void mergeField(final Tokenizer tokenizer,

- final ExtensionRegistry extensionRegistry,

- final Message.Builder builder)

- throws ParseException {

- FieldDescriptor field;

- final Descriptor type = builder.getDescriptorForType();

- ExtensionRegistry.ExtensionInfo extension = null;

- if (tokenizer.tryConsume("[")) {

- // An extension.

- final StringBuilder name =

- new StringBuilder(tokenizer.consumeIdentifier());

- while (tokenizer.tryConsume(".")) {

- name.append('.');

- name.append(tokenizer.consumeIdentifier());

- }

- extension = extensionRegistry.findExtensionByName(name.toString());

- if (extension == null) {

- throw tokenizer.parseExceptionPreviousToken(

- "Extension \"" + name + "\" not found in the ExtensionRegistry.");

- } else if (extension.descriptor.getContainingType() != type) {

- throw tokenizer.parseExceptionPreviousToken(

- "Extension \"" + name + "\" does not extend message type \"" +

- type.getFullName() + "\".");

- }

- tokenizer.consume("]");

- field = extension.descriptor;

- } else {

- final String name = tokenizer.consumeIdentifier();

- field = type.findFieldByName(name);

- // Group names are expected to be capitalized as they appear in the

- // .proto file, which actually matches their type names, not their field

- // names.

- if (field == null) {

- // Explicitly specify US locale so that this code does not break when

- // executing in Turkey.

- final String lowerName = name.toLowerCase(Locale.US);

- field = type.findFieldByName(lowerName);

- // If the case-insensitive match worked but the field is NOT a group,

- if (field != null && field.getType() != FieldDescriptor.Type.GROUP) {

- field = null;

- }

- // Again, special-case group names as described above.

- if (field != null && field.getType() == FieldDescriptor.Type.GROUP &&

- !field.getMessageType().getName().equals(name)) {

- field = null;

- }

- if (field == null) {

- throw tokenizer.parseExceptionPreviousToken(

- "Message type \"" + type.getFullName() +

- "\" has no field named \"" + name + "\".");

- }

- Object value = null;

- if (field.getJavaType() == FieldDescriptor.JavaType.MESSAGE) {

- tokenizer.tryConsume(":"); // optional

- final String endToken;

- if (tokenizer.tryConsume("<")) {

- endToken = ">";

- } else {

- tokenizer.consume("{");

- endToken = "}";

- }

- final Message.Builder subBuilder;

- if (extension == null) {

- subBuilder = builder.newBuilderForField(field);

- } else {

- subBuilder = extension.defaultInstance.newBuilderForType();

- }

- while (!tokenizer.tryConsume(endToken)) {

- if (tokenizer.atEnd()) {

- throw tokenizer.parseException(

- "Expected \"" + endToken + "\".");

- }

- mergeField(tokenizer, extensionRegistry, subBuilder);

- }

- value = subBuilder.buildPartial();

- } else {

- tokenizer.consume(":");

- switch (field.getType()) {

- case INT32:

- case SINT32:

- case SFIXED32:

- value = tokenizer.consumeInt32();

- break;

- case INT64:

- case SINT64:

- case SFIXED64:

- value = tokenizer.consumeInt64();

- break;

- case UINT32:

- case FIXED32:

- value = tokenizer.consumeUInt32();

- break;

- case UINT64:

- case FIXED64:

- value = tokenizer.consumeUInt64();

- break;

- case FLOAT:

- value = tokenizer.consumeFloat();

- break;

- case DOUBLE:

- value = tokenizer.consumeDouble();

- break;

- case BOOL:

- value = tokenizer.consumeBoolean();

- break;

- case STRING:

- value = tokenizer.consumeString();

- break;

- case BYTES:

- value = tokenizer.consumeByteString();

- break;

- case ENUM:

- final EnumDescriptor enumType = field.getEnumType();

- if (tokenizer.lookingAtInteger()) {

- final int number = tokenizer.consumeInt32();

- value = enumType.findValueByNumber(number);

- if (value == null) {

- throw tokenizer.parseExceptionPreviousToken(

- "Enum type \"" + enumType.getFullName() +

- "\" has no value with number " + number + '.');

- }

- } else {

- final String id = tokenizer.consumeIdentifier();

- value = enumType.findValueByName(id);

- if (value == null) {

- throw tokenizer.parseExceptionPreviousToken(

- "Enum type \"" + enumType.getFullName() +

- "\" has no value named \"" + id + "\".");

- }

- break;

- case MESSAGE:

- case GROUP:

- throw new RuntimeException("Can't get here.");

- }

- if (field.isRepeated()) {

- builder.addRepeatedField(field, value);

- } else {

- builder.setField(field, value);

- }

- // =================================================================

- // Utility functions

- //

- // Some of these methods are package-private because Descriptors.java uses

- // them.

- /**

- * Escapes bytes in the format used in protocol buffer text format, which

- * is the same as the format used for C string literals. All bytes

- * that are not printable 7-bit ASCII characters are escaped, as well as

- * backslash, single-quote, and double-quote characters. Characters for

- * which no defined short-hand escape sequence is defined will be escaped

- * using 3-digit octal sequences.

- */

- static String escapeBytes(final ByteString input) {

- final StringBuilder builder = new StringBuilder(input.size());

- for (int i = 0; i < input.size(); i++) {

- final byte b = input.byteAt(i);

- switch (b) {

- // Java does not recognize \a or \v, apparently.

- case 0x07: builder.append("\\a" ); break;

- case '\b': builder.append("\\b" ); break;

- case '\f': builder.append("\\f" ); break;

- case '\n': builder.append("\\n" ); break;

- case '\r': builder.append("\\r" ); break;

- case '\t': builder.append("\\t" ); break;

- case 0x0b: builder.append("\\v" ); break;

- case '\\': builder.append("\\\\"); break;

- case '\'': builder.append("\\\'"); break;

- case '"' : builder.append("\\\""); break;

- default:

- // Note: Bytes with the high-order bit set should be escaped. Since

- // bytes are signed, such bytes will compare less than 0x20, hence

- // the following line is correct.

- if (b >= 0x20) {

- builder.append((char) b);

- } else {

- builder.append('\\');

- builder.append((char) ('0' + ((b >>> 6) & 3)));

- builder.append((char) ('0' + ((b >>> 3) & 7)));

- builder.append((char) ('0' + (b & 7)));

- }

- break;

- }

- return builder.toString();

- }

- /**

- * Un-escape a byte sequence as escaped using

- * {@link #escapeBytes(ByteString)}. Two-digit hex escapes (starting with

- * "\x") are also recognized.

- */

- static ByteString unescapeBytes(final CharSequence charString)

- throws InvalidEscapeSequenceException {

- // First convert the Java character sequence to UTF-8 bytes.

- ByteString input = ByteString.copyFromUtf8(charString.toString());

- // Then unescape certain byte sequences introduced by ASCII '\\'. The valid

- // escapes can all be expressed with ASCII characters, so it is safe to

- // operate on bytes here.

- //

- // Unescaping the input byte array will result in a byte sequence that's no

- // longer than the input. That's because each escape sequence is between

- // two and four bytes long and stands for a single byte.

- final byte[] result = new byte[input.size()];

- int pos = 0;

- for (int i = 0; i < input.size(); i++) {

- byte c = input.byteAt(i);

- if (c == '\\') {

- if (i + 1 < input.size()) {

- ++i;

- c = input.byteAt(i);

- if (isOctal(c)) {

- // Octal escape.

- int code = digitValue(c);

- if (i + 1 < input.size() && isOctal(input.byteAt(i + 1))) {

- ++i;

- code = code * 8 + digitValue(input.byteAt(i));

- }

- if (i + 1 < input.size() && isOctal(input.byteAt(i + 1))) {

- ++i;

- code = code * 8 + digitValue(input.byteAt(i));

- }

- // TODO: Check that 0 <= code && code <= 0xFF.

- result[pos++] = (byte)code;

- } else {

- switch (c) {

- case 'a' : result[pos++] = 0x07; break;

- case 'b' : result[pos++] = '\b'; break;

- case 'f' : result[pos++] = '\f'; break;

- case 'n' : result[pos++] = '\n'; break;

- case 'r' : result[pos++] = '\r'; break;

- case 't' : result[pos++] = '\t'; break;

- case 'v' : result[pos++] = 0x0b; break;

- case '\\': result[pos++] = '\\'; break;

- case '\'': result[pos++] = '\''; break;

- case '"' : result[pos++] = '\"'; break;

- case 'x':

- // hex escape

- int code = 0;

- if (i + 1 < input.size() && isHex(input.byteAt(i + 1))) {

- ++i;

- code = digitValue(input.byteAt(i));

- } else {

- throw new InvalidEscapeSequenceException(

- "Invalid escape sequence: '\\x' with no digits");

- }

- if (i + 1 < input.size() && isHex(input.byteAt(i + 1))) {

- ++i;

- code = code * 16 + digitValue(input.byteAt(i));

- }

- result[pos++] = (byte)code;

- break;

- default:

- throw new InvalidEscapeSequenceException(

- "Invalid escape sequence: '\\" + (char)c + '\'');

- }

- } else {

- throw new InvalidEscapeSequenceException(

- "Invalid escape sequence: '\\' at end of string.");

- }

- } else {

- result[pos++] = c;

- }

- return ByteString.copyFrom(result, 0, pos);

- }

- /**

- * Thrown by {@link TextFormat#unescapeBytes} and

- * {@link TextFormat#unescapeText} when an invalid escape sequence is seen.

- */

- static class InvalidEscapeSequenceException extends IOException {

- private static final long serialVersionUID = -8164033650142593304L;

- InvalidEscapeSequenceException(final String description) {

- super(description);

- }

- /**

- * Like {@link #escapeBytes(ByteString)}, but escapes a text string.

- * Non-ASCII characters are first encoded as UTF-8, then each byte is escaped

- * individually as a 3-digit octal escape. Yes, it's weird.

- */

- static String escapeText(final String input) {

- return escapeBytes(ByteString.copyFromUtf8(input));

- }

- /**

- * Un-escape a text string as escaped using {@link #escapeText(String)}.

- * Two-digit hex escapes (starting with "\x") are also recognized.

- */

- static String unescapeText(final String input)

- throws InvalidEscapeSequenceException {

- return unescapeBytes(input).toStringUtf8();

- }

- /** Is this an octal digit? */

- private static boolean isOctal(final byte c) {

- return '0' <= c && c <= '7';

- }

- /** Is this a hex digit? */

- private static boolean isHex(final byte c) {

- return ('0' <= c && c <= '9') ||

- ('a' <= c && c <= 'f') ||

- ('A' <= c && c <= 'F');

- }

- /**

- * Interpret a character as a digit (in any base up to 36) and return the

- * numeric value. This is like {@code Character.digit()} but we don't accept

- * non-ASCII digits.

- */

- private static int digitValue(final byte c) {

- if ('0' <= c && c <= '9') {

- return c - '0';

- } else if ('a' <= c && c <= 'z') {

- return c - 'a' + 10;

- } else {

- return c - 'A' + 10;

- }

- /**

- * Parse a 32-bit signed integer from the text. Unlike the Java standard

- * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

- * and "0" to signify hexadecimal and octal numbers, respectively.

- */

- static int parseInt32(final String text) throws NumberFormatException {

- return (int) parseInteger(text, true, false);

- }

- /**

- * Parse a 32-bit unsigned integer from the text. Unlike the Java standard

- * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

- * and "0" to signify hexadecimal and octal numbers, respectively. The

- * result is coerced to a (signed) {@code int} when returned since Java has

- * no unsigned integer type.

- */

- static int parseUInt32(final String text) throws NumberFormatException {

- return (int) parseInteger(text, false, false);

- }

- /**

- * Parse a 64-bit signed integer from the text. Unlike the Java standard

- * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

- * and "0" to signify hexadecimal and octal numbers, respectively.

- */

- static long parseInt64(final String text) throws NumberFormatException {

- return parseInteger(text, true, true);

- }

- /**

- * Parse a 64-bit unsigned integer from the text. Unlike the Java standard

- * {@code Integer.parseInt()}, this function recognizes the prefixes "0x"

- * and "0" to signify hexadecimal and octal numbers, respectively. The

- * result is coerced to a (signed) {@code long} when returned since Java has

- * no unsigned long type.

- */

- static long parseUInt64(final String text) throws NumberFormatException {

- return parseInteger(text, false, true);

- }

- private static long parseInteger(final String text,

- final boolean isSigned,

- final boolean isLong)

- throws NumberFormatException {

- int pos = 0;

- boolean negative = false;

- if (text.startsWith("-", pos)) {

- if (!isSigned) {

- throw new NumberFormatException("Number must be positive: " + text);

- }

- ++pos;

- negative = true;

- }

- int radix = 10;

- if (text.startsWith("0x", pos)) {

- pos += 2;

- radix = 16;

- } else if (text.startsWith("0", pos)) {

- radix = 8;

- }

- final String numberText = text.substring(pos);

- long result = 0;

- if (numberText.length() < 16) {

- // Can safely assume no overflow.

- result = Long.parseLong(numberText, radix);

- if (negative) {

- result = -result;

- }

- // Check bounds.

- // No need to check for 64-bit numbers since they'd have to be 16 chars

- // or longer to overflow.

- if (!isLong) {

- if (isSigned) {

- if (result > Integer.MAX_VALUE || result < Integer.MIN_VALUE) {

- throw new NumberFormatException(

- "Number out of range for 32-bit signed integer: " + text);

- }

- } else {

- if (result >= (1L << 32) || result < 0) {

- throw new NumberFormatException(

- "Number out of range for 32-bit unsigned integer: " + text);

- }

- } else {

- BigInteger bigValue = new BigInteger(numberText, radix);

- if (negative) {

- bigValue = bigValue.negate();

- }

- // Check bounds.

- if (!isLong) {

- if (isSigned) {

- if (bigValue.bitLength() > 31) {

- throw new NumberFormatException(

- "Number out of range for 32-bit signed integer: " + text);

- }

- } else {

- if (bigValue.bitLength() > 32) {

- throw new NumberFormatException(

- "Number out of range for 32-bit unsigned integer: " + text);

- }

- } else {

- if (isSigned) {

- if (bigValue.bitLength() > 63) {

- throw new NumberFormatException(

- "Number out of range for 64-bit signed integer: " + text);

- }

- } else {

- if (bigValue.bitLength() > 64) {

- throw new NumberFormatException(

- "Number out of range for 64-bit unsigned integer: " + text);

- }

- result = bigValue.longValue();

- }

- return result;

- }