third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp - Issue 2470043004: Fix vector resize logic when encoding non-BMP chars to latin1 as ?s

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp

Issue 2470043004: Fix vector resize logic when encoding non-BMP chars to latin1 as ?s (Closed)

Patch Set: rebased Created 4 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp

diff --git a/third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp b/third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp

index 766b7fcd5ae2eae0cb9e5eda4c25503b58dac39e..fe98761f645e1ab4179e81f9b89b619e5a17d358 100644

--- a/third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp

+++ b/third_party/WebKit/Source/wtf/text/TextCodecLatin1.cpp

@@ -206,13 +206,20 @@ template <typename CharType>

static CString encodeComplexWindowsLatin1(const CharType* characters,

size_t length,

UnencodableHandling handling) {

- Vector<char> result(length);

+ size_t targetLength = length;

+ Vector<char> result(targetLength);

char* bytes = result.data();

size_t resultLength = 0;

for (size_t i = 0; i < length;) {

UChar32 c;

+ // If CharType is LChar the U16_NEXT call reads a byte and increments;

+ // since the convention is that LChar is already latin1 this is safe.

U16_NEXT(characters, i, length, c);

+ // If input was a surrogate pair (non-BMP character) then we overestimated

+ // the length.

+ if (c > 0xffff)

+ --targetLength;

unsigned char b = static_cast<unsigned char>(c);

// Do an efficient check to detect characters other than 00-7F and A0-FF.

if (b != c || (c & 0xE0) == 0x80) {

@@ -225,8 +232,16 @@ static CString encodeComplexWindowsLatin1(const CharType* characters,

UnencodableReplacementArray replacement;

int replacementLength =

TextCodec::getUnencodableReplacement(c, handling, replacement);

- result.grow(resultLength + replacementLength + length - i);

- bytes = result.data();

+ DCHECK_GT(replacementLength, 0);

+ // Only one char was initially reserved per input character, so grow if

+ // necessary. Note that the case of surrogate pairs and

+ // QuestionMarksForUnencodables the result length may be shorter than

+ // the input length.

+ targetLength += replacementLength - 1;

+ if (targetLength > result.size()) {

+ result.grow(targetLength);

+ bytes = result.data();

+ }

memcpy(bytes + resultLength, replacement, replacementLength);

resultLength += replacementLength;

continue;

« no previous file with comments | « third_party/WebKit/Source/wtf/BUILD.gn ('k') | third_party/WebKit/Source/wtf/text/TextCodecLatin1Test.cpp » ('j') | no next file with comments »