Index: tools/gn/string_utils.cc |
diff --git a/tools/gn/string_utils.cc b/tools/gn/string_utils.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..14d296a51e2bc727ffd59194beae1d09053ad645 |
--- /dev/null |
+++ b/tools/gn/string_utils.cc |
@@ -0,0 +1,168 @@ |
+// Copyright (c) 2013 The Chromium Authors. All rights reserved. |
+// Use of this source code is governed by a BSD-style license that can be |
+// found in the LICENSE file. |
+ |
+#include "tools/gn/string_utils.h" |
+ |
+#include "tools/gn/err.h" |
+#include "tools/gn/scope.h" |
+#include "tools/gn/token.h" |
+#include "tools/gn/tokenizer.h" |
+#include "tools/gn/value.h" |
+ |
+namespace { |
+ |
+// Constructs an Err indicating a range inside a string. We assume that the |
+// token has quotes around it that are not counted by the offset. |
+Err ErrInsideStringToken(const Token& token, size_t offset, size_t size, |
+ const std::string& msg, |
+ const std::string& help = std::string()) { |
+ // The "+1" is skipping over the " at the beginning of the token. |
+ Location begin_loc(token.location().file(), |
+ token.location().line_number(), |
+ token.location().char_offset() + offset + 1); |
+ Location end_loc(token.location().file(), |
+ token.location().line_number(), |
+ token.location().char_offset() + offset + 1 + size); |
+ return Err(LocationRange(begin_loc, end_loc), msg, help); |
+} |
+ |
+// Given the character input[i] indicating the $ in a string, locates the |
+// identifier and places its range in |*identifier|, and updates |*i| to |
+// point to the last character consumed. |
+// |
+// On error returns false and sets the error. |
+bool LocateInlineIdenfitier(const Token& token, |
+ const char* input, size_t size, |
+ size_t* i, |
+ base::StringPiece* identifier, |
+ Err* err) { |
+ size_t dollars_index = *i; |
+ (*i)++; |
+ if (*i == size) { |
+ *err = ErrInsideStringToken(token, dollars_index, 1, "$ at end of string.", |
+ "I was expecting an identifier after the $."); |
+ return false; |
+ } |
+ |
+ bool has_brackets; |
+ if (input[*i] == '{') { |
+ (*i)++; |
+ if (*i == size) { |
+ *err = ErrInsideStringToken(token, dollars_index, 2, |
+ "${ at end of string.", |
+ "I was expecting an identifier inside the ${...}."); |
+ return false; |
+ } |
+ has_brackets = true; |
+ } else { |
+ has_brackets = false; |
+ } |
+ |
+ // First char is special. |
+ if (!Tokenizer::IsIdentifierFirstChar(input[*i])) { |
+ *err = ErrInsideStringToken( |
+ token, dollars_index, *i - dollars_index + 1, |
+ "$ not followed by an identifier char.", |
+ "It you want a literal $ use \"\\$\"."); |
+ return false; |
+ } |
+ size_t begin_offset = *i; |
+ (*i)++; |
+ |
+ // Find the first non-identifier char following the string. |
+ while (*i < size && Tokenizer::IsIdentifierContinuingChar(input[*i])) |
+ (*i)++; |
+ size_t end_offset = *i; |
+ |
+ // If we started with a bracket, validate that there's an ending one. Leave |
+ // *i pointing to the last char we consumed (backing up one). |
+ if (has_brackets) { |
+ if (*i == size) { |
+ *err = ErrInsideStringToken(token, dollars_index, *i - dollars_index, |
+ "Unterminated ${..."); |
+ return false; |
+ } else if (input[*i] != '}') { |
+ *err = ErrInsideStringToken(token, *i, 1, "Not an identifier in string expansion.", |
+ "The contents of ${...} should be an identifier. " |
+ "This character is out of sorts."); |
+ return false; |
+ } |
+ // We want to consume the bracket but also back up one, so *i is unchanged. |
+ } else { |
+ (*i)--; |
+ } |
+ |
+ *identifier = base::StringPiece(&input[begin_offset], |
+ end_offset - begin_offset); |
+ return true; |
+} |
+ |
+bool AppendIdentifierValue(Scope* scope, |
+ const Token& token, |
+ const base::StringPiece& identifier, |
+ std::string* output, |
+ Err* err) { |
+ const Value* value = scope->GetValue(identifier, true); |
+ if (!value) { |
+ // We assume the identifier points inside the token. |
+ *err = ErrInsideStringToken( |
+ token, identifier.data() - token.value().data() - 1, identifier.size(), |
+ "Undefined identifier in string expansion.", |
+ std::string("\"") + identifier + "\" is not currently in scope."); |
+ return false; |
+ } |
+ |
+ output->append(value->ToString()); |
+ return true; |
+} |
+ |
+} // namespace |
+ |
+bool ExpandStringLiteral(Scope* scope, |
+ const Token& literal, |
+ Value* result, |
+ Err* err) { |
+ DCHECK(literal.type() == Token::STRING); |
+ DCHECK(literal.value().size() > 1); // Should include quotes. |
+ DCHECK(result->type() == Value::STRING); // Should be already set. |
+ |
+ // The token includes the surrounding quotes, so strip those off. |
+ const char* input = &literal.value().data()[1]; |
+ size_t size = literal.value().size() - 2; |
+ |
+ std::string& output = result->string_value(); |
+ output.reserve(size); |
+ for (size_t i = 0; i < size; i++) { |
+ if (input[i] == '\\') { |
+ if (i < size - 1) { |
+ switch (input[i + 1]) { |
+ case '\\': |
+ case '"': |
+ case '$': |
+ output.push_back(input[i + 1]); |
+ i++; |
+ continue; |
+ default: // Everything else has no meaning: pass the literal. |
+ break; |
+ } |
+ } |
+ output.push_back(input[i]); |
+ } else if (input[i] == '$') { |
+ base::StringPiece identifier; |
+ if (!LocateInlineIdenfitier(literal, input, size, &i, &identifier, err)) |
+ return false; |
+ if (!AppendIdentifierValue(scope, literal, identifier, &output, err)) |
+ return false; |
+ } else { |
+ output.push_back(input[i]); |
+ } |
+ } |
+ return true; |
+} |
+ |
+std::string RemovePrefix(const std::string& str, const std::string& prefix) { |
+ CHECK(str.size() >= prefix.size() && |
+ str.compare(0, prefix.size(), prefix) == 0); |
+ return str.substr(prefix.size()); |
+} |