Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(553)

Side by Side Diff: base/strings/string_split.h

Issue 1641513004: Update //base to chromium 9659b08ea5a34f889dc4166217f438095ddc10d2 (Closed) Base URL: git@github.com:domokit/mojo.git@master
Patch Set: Created 4 years, 10 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « base/strings/string_piece.h ('k') | base/strings/string_split.cc » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments / Hide Comments ('s')
OLD | NEW
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #ifndef BASE_STRINGS_STRING_SPLIT_H_ 5 #ifndef BASE_STRINGS_STRING_SPLIT_H_
6 #define BASE_STRINGS_STRING_SPLIT_H_ 6 #define BASE_STRINGS_STRING_SPLIT_H_
7 7
8 #include <string> 8 #include <string>
9 #include <utility> 9 #include <utility>
10 #include <vector> 10 #include <vector>
11 11
12 #include "base/base_export.h" 12 #include "base/base_export.h"
13 #include "base/strings/string16.h" 13 #include "base/strings/string16.h"
14 #include "base/strings/string_piece.h"
14 15
15 namespace base { 16 namespace base {
16 17
17 // Splits |str| into a vector of strings delimited by |c|, placing the results 18 enum WhitespaceHandling {
18 // in |r|. If several instances of |c| are contiguous, or if |str| begins with 19 KEEP_WHITESPACE,
19 // or ends with |c|, then an empty string is inserted. 20 TRIM_WHITESPACE,
21 };
22
23 enum SplitResult {
24 // Strictly return all results.
25 //
26 // If the input is ",," and the separator is ',' this will return a
27 // vector of three empty strings.
28 SPLIT_WANT_ALL,
29
30 // Only nonempty results will be added to the results. Multiple separators
31 // will be coalesced. Separators at the beginning and end of the input will
32 // be ignored. With TRIM_WHITESPACE, whitespace-only results will be dropped.
33 //
34 // If the input is ",," and the separator is ',', this will return an empty
35 // vector.
36 SPLIT_WANT_NONEMPTY,
37 };
38
39 // Split the given string on ANY of the given separators, returning copies of
40 // the result.
20 // 41 //
21 // Every substring is trimmed of any leading or trailing white space. 42 // To split on either commas or semicolons, keeping all whitespace:
22 // NOTE: |c| must be in BMP (Basic Multilingual Plane) 43 //
23 BASE_EXPORT void SplitString(const string16& str, 44 // std::vector<std::string> tokens = base::SplitString(
24 char16 c, 45 // input, ",;", base::KEEP_WHITESPACE, base::SPLIT_WANT_ALL);
25 std::vector<string16>* r); 46 BASE_EXPORT std::vector<std::string> SplitString(StringPiece input,
47 StringPiece separators,
48 WhitespaceHandling whitespace,
49 SplitResult result_type);
50 BASE_EXPORT std::vector<string16> SplitString(StringPiece16 input,
51 StringPiece16 separators,
52 WhitespaceHandling whitespace,
53 SplitResult result_type);
26 54
27 // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which 55 // Like SplitString above except it returns a vector of StringPieces which
28 // the trailing byte of a multi-byte character can be in the ASCII range. 56 // reference the original buffer without copying. Although you have to be
29 // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK. 57 // careful to keep the original string unmodified, this provides an efficient
30 // Note: |c| must be in the ASCII range. 58 // way to iterate through tokens in a string.
31 BASE_EXPORT void SplitString(const std::string& str, 59 //
32 char c, 60 // To iterate through all whitespace-separated tokens in an input string:
33 std::vector<std::string>* r); 61 //
62 // for (const auto& cur :
63 // base::SplitStringPiece(input, base::kWhitespaceASCII,
64 // base::KEEP_WHITESPACE,
65 // base::SPLIT_WANT_NONEMPTY)) {
66 // ...
67 BASE_EXPORT std::vector<StringPiece> SplitStringPiece(
68 StringPiece input,
69 StringPiece separators,
70 WhitespaceHandling whitespace,
71 SplitResult result_type);
72 BASE_EXPORT std::vector<StringPiece16> SplitStringPiece(
73 StringPiece16 input,
74 StringPiece16 separators,
75 WhitespaceHandling whitespace,
76 SplitResult result_type);
34 77
35 typedef std::vector<std::pair<std::string, std::string> > StringPairs; 78 using StringPairs = std::vector<std::pair<std::string, std::string>>;
36 79
37 // Splits |line| into key value pairs according to the given delimiters and 80 // Splits |line| into key value pairs according to the given delimiters and
38 // removes whitespace leading each key and trailing each value. Returns true 81 // removes whitespace leading each key and trailing each value. Returns true
39 // only if each pair has a non-empty key and value. |key_value_pairs| will 82 // only if each pair has a non-empty key and value. |key_value_pairs| will
40 // include ("","") pairs for entries without |key_value_delimiter|. 83 // include ("","") pairs for entries without |key_value_delimiter|.
41 BASE_EXPORT bool SplitStringIntoKeyValuePairs(const std::string& line, 84 BASE_EXPORT bool SplitStringIntoKeyValuePairs(const std::string& line,
42 char key_value_delimiter, 85 char key_value_delimiter,
43 char key_value_pair_delimiter, 86 char key_value_pair_delimiter,
44 StringPairs* key_value_pairs); 87 StringPairs* key_value_pairs);
45 88
46 // The same as SplitString, but use a substring delimiter instead of a char. 89 // Similar to SplitString, but use a substring delimiter instead of a list of
90 // characters that are all possible delimiters.
91 //
92 // TODO(brettw) this should probably be changed and expanded to provide a
93 // mirror of the SplitString[Piece] API above, just with the different
94 // delimiter handling.
47 BASE_EXPORT void SplitStringUsingSubstr(const string16& str, 95 BASE_EXPORT void SplitStringUsingSubstr(const string16& str,
48 const string16& s, 96 const string16& s,
49 std::vector<string16>* r); 97 std::vector<string16>* r);
50 BASE_EXPORT void SplitStringUsingSubstr(const std::string& str, 98 BASE_EXPORT void SplitStringUsingSubstr(const std::string& str,
51 const std::string& s, 99 const std::string& s,
52 std::vector<std::string>* r); 100 std::vector<std::string>* r);
53 101
102 // -----------------------------------------------------------------------------
103 // Backwards-compat wrappers
104 //
105 // New code should use one of the more general variants above.
106 // TODO(brettw) remove these and convert to the versions above.
107
108 // Splits |str| into a vector of strings delimited by |c|, placing the results
109 // in |r|. If several instances of |c| are contiguous, or if |str| begins with
110 // or ends with |c|, then an empty string is inserted.
111 //
112 // Every substring is trimmed of any leading or trailing white space.
113 // NOTE: |c| must be in BMP (Basic Multilingual Plane)
114 BASE_EXPORT void SplitString(const string16& str,
115 char16 c,
116 std::vector<string16>* r);
117
118 // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which
119 // the trailing byte of a multi-byte character can be in the ASCII range.
120 // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK.
121 // Note: |c| must be in the ASCII range.
122 BASE_EXPORT void SplitString(const std::string& str,
123 char c,
124 std::vector<std::string>* r);
125
54 // The same as SplitString, but don't trim white space. 126 // The same as SplitString, but don't trim white space.
55 // NOTE: |c| must be in BMP (Basic Multilingual Plane) 127 // NOTE: |c| must be in BMP (Basic Multilingual Plane)
56 BASE_EXPORT void SplitStringDontTrim(const string16& str, 128 BASE_EXPORT void SplitStringDontTrim(StringPiece16 str,
57 char16 c, 129 char16 c,
58 std::vector<string16>* r); 130 std::vector<string16>* r);
59 // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which 131 // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which
60 // the trailing byte of a multi-byte character can be in the ASCII range. 132 // the trailing byte of a multi-byte character can be in the ASCII range.
61 // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK. 133 // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK.
62 // Note: |c| must be in the ASCII range. 134 // Note: |c| must be in the ASCII range.
63 BASE_EXPORT void SplitStringDontTrim(const std::string& str, 135 BASE_EXPORT void SplitStringDontTrim(StringPiece str,
64 char c, 136 char c,
65 std::vector<std::string>* r); 137 std::vector<std::string>* result);
66 138
67 // WARNING: this uses whitespace as defined by the HTML5 spec. If you need 139 // WARNING: this uses whitespace as defined by the HTML5 spec (ASCII whitespace
68 // a function similar to this but want to trim all types of whitespace, then 140 // only).
69 // factor this out into a function that takes a string containing the characters
70 // that are treated as whitespace.
71 // 141 //
72 // Splits the string along whitespace (where whitespace is the five space 142 // The difference between this and calling SplitString with the whitespace
73 // characters defined by HTML 5). Each contiguous block of non-whitespace 143 // characters as separators is the treatment of the first element when the
74 // characters is added to result. 144 // string starts with whitespace.
145 //
146 // Input SplitString SplitStringAlongWhitespace
147 // --------------------------------------------------------
148 // " a " "", "a" "a"
75 BASE_EXPORT void SplitStringAlongWhitespace(const string16& str, 149 BASE_EXPORT void SplitStringAlongWhitespace(const string16& str,
76 std::vector<string16>* result); 150 std::vector<string16>* result);
77 BASE_EXPORT void SplitStringAlongWhitespace(const std::string& str, 151 BASE_EXPORT void SplitStringAlongWhitespace(const std::string& str,
78 std::vector<std::string>* result); 152 std::vector<std::string>* result);
79 153
80 } // namespace base 154 } // namespace base
81 155
82 #endif // BASE_STRINGS_STRING_SPLIT_H_ 156 #endif // BASE_STRINGS_STRING_SPLIT_H_
OLD | NEW
« no previous file with comments | « base/strings/string_piece.h ('k') | base/strings/string_split.cc » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698