Chromium Code Reviews

| OLD | NEW |
|---|---|
| 1 // Copyright 2016 The Chromium Authors. All rights reserved. | 1 // Copyright 2016 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #ifndef WTF_StringView_h | 5 #ifndef WTF_StringView_h |
| 6 #define WTF_StringView_h | 6 #define WTF_StringView_h |
| 7 | 7 |
| 8 #include "wtf/Allocator.h" | 8 #include "wtf/Allocator.h" |
| 9 #include "wtf/GetPtr.h" | |
| 9 #if DCHECK_IS_ON() | 10 #if DCHECK_IS_ON() |
| 10 #include "wtf/RefPtr.h" | 11 #include "wtf/RefPtr.h" |
| 11 #endif | 12 #endif |
| 12 #include "wtf/text/AtomicString.h" | 13 #include "wtf/text/AtomicString.h" |
| 13 #include "wtf/text/StringImpl.h" | 14 #include "wtf/text/StringImpl.h" |
| 14 #include "wtf/text/Unicode.h" | 15 #include "wtf/text/Unicode.h" |
| 15 #include "wtf/text/WTFString.h" | 16 #include "wtf/text/WTFString.h" |
| 16 #include <cstring> | 17 #include <cstring> |
| 17 | 18 |
| 18 namespace WTF { | 19 namespace WTF { |
| 19 | 20 |
| 20 // A string like object that wraps either an 8bit or 16bit byte sequence | 21 // A string like object that wraps either an 8bit or 16bit byte sequence |
| 21 // and keeps track of the length and the type, it does NOT own the bytes. | 22 // and keeps track of the length and the type, it does NOT own the bytes. |
| 22 // | 23 // |
| 23 // Since StringView does not own the bytes creating a StringView from a String, | 24 // Since StringView does not own the bytes creating a StringView from a String, |
| 24 // then calling clear() on the string will result in a use-after-free. Asserts | 25 // then calling clear() on the String will result in a use-after-free. Asserts |
| 25 // in ~StringView attempt to enforce this for most common cases. | 26 // in ~StringView attempt to enforce this for most common cases. |
| 26 // | 27 // |
| 27 // See base/strings/string_piece.h for more details. | 28 // See base/strings/string_piece.h for more details. |
| 28 class WTF_EXPORT StringView { | 29 class WTF_EXPORT StringView { |
| 29 DISALLOW_NEW_EXCEPT_PLACEMENT_NEW(); | 30 DISALLOW_NEW_EXCEPT_PLACEMENT_NEW(); |
| 30 public: | 31 public: |
| 31 // Null string. | 32 // Null string. |
| 32 StringView() { clear(); } | 33 StringView() { clear(); } |
| 33 | 34 |
| 34 // From a StringView: | 35 // From a StringView: |
| 35 StringView(const StringView&, unsigned offset, unsigned length); | 36 StringView(const StringView&, unsigned offset, unsigned length); |
| 36 StringView(const StringView& view, unsigned offset) | 37 StringView(const StringView& view, unsigned offset) |
| 37 : StringView(view, offset, view.m_length - offset) {} | 38 : StringView(view, offset, view.m_length - offset) {} |
| 38 | 39 |
| 39 // From a StringImpl: | 40 // From a StringImpl: |
| 40 StringView(StringImpl*); | 41 StringView(StringImpl*); |
| 41 StringView(StringImpl*, unsigned offset); | 42 StringView(StringImpl*, unsigned offset); |
| 42 StringView(StringImpl*, unsigned offset, unsigned length); | 43 StringView(StringImpl*, unsigned offset, unsigned length); |
| 43 | 44 |
| 44 // From a String: | 45 // From a String: |
| 45 StringView(const String& string, unsigned offset, unsigned length) | 46 StringView(const String& string, unsigned offset, unsigned length) |
| 46 : StringView(string.impl(), offset, length) {} | 47 : StringView(string.impl(), offset, length) {} |
| 47 StringView(const String& string, unsigned offset) | 48 StringView(const String& string, unsigned offset) |
| 48 : StringView(string.impl(), offset) {} | 49 : StringView(string.impl(), offset) {} |
| 49 StringView(const String& string) | 50 StringView(const String& string) |
| 50 : StringView(string, 0, string.length()) {} | 51 : StringView(string.impl()) {} |
| 51 | 52 |
| 52 // From an AtomicString: | 53 // From an AtomicString: |
| 53 StringView(const AtomicString& string, unsigned offset, unsigned length) | 54 StringView(const AtomicString& string, unsigned offset, unsigned length) |
| 54 : StringView(string.impl(), offset, length) {} | 55 : StringView(string.impl(), offset, length) {} |
| 55 StringView(const AtomicString& string, unsigned offset) | 56 StringView(const AtomicString& string, unsigned offset) |
| 56 : StringView(string.impl(), offset) {} | 57 : StringView(string.impl(), offset) {} |
| 57 StringView(const AtomicString& string) | 58 StringView(const AtomicString& string) |
| 58 : StringView(string, 0, string.length()) {} | 59 : StringView(string.impl()) {} |
| 59 | 60 |
| 60 // From a literal string or LChar buffer: | 61 // From a literal string or LChar buffer: |
| 61 StringView(const LChar* chars, unsigned length); | 62 StringView(const LChar* chars, unsigned length) |
| 63 : StringView(reinterpret_cast<const void*>(chars), length, true) {} | |
| 62 StringView(const char* chars, unsigned length) | 64 StringView(const char* chars, unsigned length) |
| 63 : StringView(reinterpret_cast<const LChar*>(chars), length) {} | 65 : StringView(reinterpret_cast<const LChar*>(chars), length) {} |
| 64 StringView(const LChar* chars) | 66 StringView(const LChar* chars) |
| 65 : StringView(chars, chars ? strlen(reinterpret_cast<const char*>(chars)) : 0) {} | 67 : StringView(chars, chars ? strlen(reinterpret_cast<const char*>(chars)) : 0) {} |
| 66 StringView(const char* chars) | 68 StringView(const char* chars) |
| 67 : StringView(reinterpret_cast<const LChar*>(chars)) {} | 69 : StringView(reinterpret_cast<const LChar*>(chars)) {} |
| 68 | 70 |
| 69 // From a wide literal string or UChar buffer. | 71 // From a wide literal string or UChar buffer. |
| 72 StringView(const UChar* chars, unsigned length) | |
| 73 : StringView(reinterpret_cast<const void*>(chars), length, false) {} | |
| 70 StringView(const UChar* chars); | 74 StringView(const UChar* chars); |
| 71 StringView(const UChar* chars, unsigned length); | |
| 72 | 75 |
| 73 // From a byte pointer. | 76 // From a byte pointer. |
| 74 StringView(const void* bytes, unsigned length, bool is8Bit) | 77 StringView(const void* bytes, unsigned length, bool is8Bit) |
| 75 : m_length(length) | 78 : m_impl(is8Bit ? StringImpl::empty() : StringImpl::empty16Bit()) |
| 76 , m_is8Bit(is8Bit) | 79 , m_bytes(bytes) |
| 77 { | 80 , m_length(length) {} |
| 78 m_data.bytes = bytes; | |
| 79 } | |
| 80 | 81 |
| 81 #if DCHECK_IS_ON() | 82 #if DCHECK_IS_ON() |
| 82 ~StringView(); | 83 ~StringView(); |
| 83 #endif | 84 #endif |
| 84 | 85 |
| 85 bool isNull() const { return !m_data.bytes; } | 86 bool isNull() const { return !m_bytes; } |
| 86 bool isEmpty() const { return !m_length; } | 87 bool isEmpty() const { return !m_length; } |
| 87 | 88 |
| 88 unsigned length() const { return m_length; } | 89 unsigned length() const { return m_length; } |
| 89 | 90 |
| 90 bool is8Bit() const { return m_is8Bit; } | 91 bool is8Bit() const { DCHECK(m_impl); return m_impl->is8Bit(); } |
| 91 | 92 |
| 92 void clear(); | 93 void clear(); |
| 93 | 94 |
| 94 UChar operator[](unsigned i) const | 95 UChar operator[](unsigned i) const |
| 95 { | 96 { |
| 96 SECURITY_DCHECK(i < length()); | 97 SECURITY_DCHECK(i < length()); |
| 97 if (is8Bit()) | 98 if (is8Bit()) |
| 98 return characters8()[i]; | 99 return characters8()[i]; |
| 99 return characters16()[i]; | 100 return characters16()[i]; |
| 100 } | 101 } |
| 101 | 102 |
| 102 const LChar* characters8() const | 103 const LChar* characters8() const |
| 103 { | 104 { |
| 104 ASSERT(is8Bit()); | 105 DCHECK(is8Bit()); |
| 105 return m_data.characters8; | 106 return m_characters8; |
| 106 } | 107 } |
| 107 | 108 |
| 108 const UChar* characters16() const | 109 const UChar* characters16() const |
| 109 { | 110 { |
| 110 ASSERT(!is8Bit()); | 111 DCHECK(!is8Bit()); |
| 111 return m_data.characters16; | 112 return m_characters16; |
| 112 } | 113 } |
| 113 | 114 |
| 114 const void* bytes() const { return m_data.bytes; } | 115 const void* bytes() const { return m_bytes; } |
| 116 | |
| 117 // This is not named impl() like String because it has different semantics. | |
| 118 // String::impl() is never null if String::isNull() is false. For StringView | |
| 119 // sharedImpl() can be null if the StringView was created with a non-zero | |
| 120 // offset, or a length that made it shorter than the underlying impl. | |
| 121 StringImpl* sharedImpl() const | |
| 122 { | |
| 123 // If this StringView is backed by a StringImpl, and was constructed | |
| 124 // with a zero offset and the same length we can just access the impl | |
| 125 // directly since this == StringView(m_impl). | |
| 126 if (m_impl->bytes() == bytes() && m_length == m_impl->length()) | |
|
haraken
2016/06/06 02:28:52
Would you help me understand why do you need to ch
esprehn
2016/06/06 04:42:21
A StringView can be a shorter length than the unde
| |
| 127 return getPtr(m_impl); | |
| 128 return nullptr; | |
| 129 } | |
| 115 | 130 |
| 116 String toString() const; | 131 String toString() const; |
| 117 AtomicString toAtomicString() const; | 132 AtomicString toAtomicString() const; |
| 118 | 133 |
| 119 private: | 134 private: |
| 120 void set(StringImpl&, unsigned offset, unsigned length); | 135 void set(StringImpl&, unsigned offset, unsigned length); |
| 121 | 136 |
| 137 // We use the StringImpl to mark for 8bit or 16bit, even for strings where | |
| 138 // we were constructed from a char pointer. So m_impl->bytes() might have | |
| 139 // nothing to do with this view's bytes(). | |
| 122 #if DCHECK_IS_ON() | 140 #if DCHECK_IS_ON() |
| 123 RefPtr<StringImpl> m_impl; | 141 RefPtr<StringImpl> m_impl; |
| 142 #else | |
| 143 StringImpl* m_impl; | |
|
haraken
2016/06/06 02:28:52
Who guarantees that someone else keeps a reference
esprehn
2016/06/06 04:42:21
The caller does, this is the same as base::StringP
haraken
2016/06/06 05:02:35
Thanks for the details. Makes sense.
The assertio
| |
| 124 #endif | 144 #endif |
| 125 union DataUnion { | 145 union { |
| 126 const LChar* characters8; | 146 const LChar* m_characters8; |
| 127 const UChar* characters16; | 147 const UChar* m_characters16; |
| 128 const void* bytes; | 148 const void* m_bytes; |
|
haraken
2016/06/06 02:28:52
Worth adding a comment that how each of the fields
esprehn
2016/06/06 04:42:21
This is the same as String's semantics. In the nex
haraken
2016/06/06 05:02:35
That sounds great.
| |
| 129 } m_data; | 149 }; |
| 130 unsigned m_length; | 150 unsigned m_length; |
| 131 unsigned m_is8Bit : 1; | |
| 132 }; | 151 }; |
| 133 | 152 |
| 134 inline StringView::StringView(const StringView& view, unsigned offset, unsigned length) | 153 inline StringView::StringView(const StringView& view, unsigned offset, unsigned length) |
| 135 : m_length(length) | 154 : m_impl(view.m_impl) |
| 136 , m_is8Bit(view.is8Bit()) | 155 , m_length(length) |
| 137 { | 156 { |
| 138 SECURITY_DCHECK(offset + length <= view.length()); | 157 SECURITY_DCHECK(offset + length <= view.length()); |
| 139 if (is8Bit()) | 158 if (is8Bit()) |
| 140 m_data.characters8 = view.characters8() + offset; | 159 m_characters8 = view.characters8() + offset; |
| 141 else | 160 else |
| 142 m_data.characters16 = view.characters16() + offset; | 161 m_characters16 = view.characters16() + offset; |
| 143 } | 162 } |
| 144 | 163 |
| 145 inline StringView::StringView(StringImpl* impl) | 164 inline StringView::StringView(StringImpl* impl) |
| 146 { | 165 { |
| 147 impl ? set(*impl, 0, impl->length()) : clear(); | 166 if (!impl) { |
| 167 clear(); | |
| 168 return; | |
| 169 } | |
| 170 m_impl = impl; | |
| 171 m_length = impl->length(); | |
| 172 m_bytes = impl->bytes(); | |
| 148 } | 173 } |
| 149 | 174 |
| 150 inline StringView::StringView(StringImpl* impl, unsigned offset) | 175 inline StringView::StringView(StringImpl* impl, unsigned offset) |
| 151 { | 176 { |
| 152 impl ? set(*impl, offset, impl->length() - offset) : clear(); | 177 impl ? set(*impl, offset, impl->length() - offset) : clear(); |
| 153 } | 178 } |
| 154 | 179 |
| 155 inline StringView::StringView(StringImpl* impl, unsigned offset, unsigned length) | 180 inline StringView::StringView(StringImpl* impl, unsigned offset, unsigned length) |
| 156 { | 181 { |
| 157 impl ? set(*impl, offset, length) : clear(); | 182 impl ? set(*impl, offset, length) : clear(); |
| 158 } | 183 } |
| 159 | 184 |
| 160 inline StringView::StringView(const LChar* chars, unsigned length) | |
| 161 : m_length(length) | |
| 162 , m_is8Bit(true) | |
| 163 { | |
| 164 m_data.characters8 = chars; | |
| 165 } | |
| 166 | |
| 167 inline void StringView::clear() | 185 inline void StringView::clear() |
| 168 { | 186 { |
| 169 m_length = 0; | 187 m_length = 0; |
| 170 m_is8Bit = true; | 188 m_bytes = nullptr; |
| 171 m_data.bytes = nullptr; | 189 m_impl = StringImpl::empty(); // mark as 8 bit. |
| 172 #if DCHECK_IS_ON() | |
| 173 m_impl = nullptr; | |
| 174 #endif | |
| 175 } | 190 } |
| 176 | 191 |
| 177 inline void StringView::set(StringImpl& impl, unsigned offset, unsigned length) | 192 inline void StringView::set(StringImpl& impl, unsigned offset, unsigned length) |
| 178 { | 193 { |
| 179 SECURITY_DCHECK(offset + length <= impl.length()); | 194 SECURITY_DCHECK(offset + length <= impl.length()); |
| 180 m_length = length; | 195 m_length = length; |
| 181 m_is8Bit = impl.is8Bit(); | |
| 182 #if DCHECK_IS_ON() | |
| 183 m_impl = &impl; | 196 m_impl = &impl; |
| 184 #endif | 197 if (impl.is8Bit()) |
| 185 if (m_is8Bit) | 198 m_characters8 = impl.characters8() + offset; |
| 186 m_data.characters8 = impl.characters8() + offset; | |
| 187 else | 199 else |
| 188 m_data.characters16 = impl.characters16() + offset; | 200 m_characters16 = impl.characters16() + offset; |
| 189 } | 201 } |
| 190 | 202 |
| 191 WTF_EXPORT bool equalIgnoringASCIICase(const StringView& a, const StringView& b); | 203 WTF_EXPORT bool equalIgnoringASCIICase(const StringView& a, const StringView& b); |
| 192 | 204 |
| 193 // TODO(esprehn): Can't make this an overload of WTF::equal since that makes | 205 // TODO(esprehn): Can't make this an overload of WTF::equal since that makes |
| 194 // calls to equal() that pass literal strings ambiguous. Figure out if we can | 206 // calls to equal() that pass literal strings ambiguous. Figure out if we can |
| 195 // replace all the callers with equalStringView and then rename it to equal(). | 207 // replace all the callers with equalStringView and then rename it to equal(). |
| 196 WTF_EXPORT bool equalStringView(const StringView&, const StringView&); | 208 WTF_EXPORT bool equalStringView(const StringView&, const StringView&); |
| 197 | 209 |
| 198 inline bool operator==(const StringView& a, const StringView& b) | 210 inline bool operator==(const StringView& a, const StringView& b) |
| 199 { | 211 { |
| 200 return equalStringView(a, b); | 212 return equalStringView(a, b); |
| 201 } | 213 } |
| 202 | 214 |
| 203 inline bool operator!=(const StringView& a, const StringView& b) | 215 inline bool operator!=(const StringView& a, const StringView& b) |
| 204 { | 216 { |
| 205 return !(a == b); | 217 return !(a == b); |
| 206 } | 218 } |
| 207 | 219 |
| 208 } // namespace WTF | 220 } // namespace WTF |
| 209 | 221 |
| 210 using WTF::StringView; | 222 using WTF::StringView; |
| 211 | 223 |
| 212 #endif | 224 #endif |
| OLD | NEW |