url/url_canon_mailtourl.cc - Issue 2820373002: Reland of 'Improve canonicalization of mailto url path components'

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: url/url_canon_mailtourl.cc

Issue 2820373002: Reland of 'Improve canonicalization of mailto url path components' (Closed)

Patch Set: Created 3 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: url/url_canon_mailtourl.cc

diff --git a/url/url_canon_mailtourl.cc b/url/url_canon_mailtourl.cc

index fb6bc9ab7e70ec62409efc7fa92e29822e09618e..8a7ff1ae6b7a2ccaa44cd17fb58e35f470a4cda0 100644

--- a/url/url_canon_mailtourl.cc

+++ b/url/url_canon_mailtourl.cc

@@ -13,6 +13,23 @@ namespace url {

namespace {

+// Certain characters should be percent-encoded when they appear in the path

+// component of a mailto URL, to improve compatibility and mitigate against

+// command-injection attacks on mailto handlers. See https://crbug.com/711020.

+template <typename UCHAR>

+bool ShouldEncodeMailboxCharacter(UCHAR uch) {

+ if (uch < 0x21 || // space & control characters.

+ uch > 0x7e || // high-ascii characters.

+ uch == 0x22 || // quote.

+ uch == 0x3c || uch == 0x3e || // angle brackets.

+ uch == 0x60 || // backtick.

+ uch == 0x7b || uch == 0x7c || uch == 0x7d // braces and pipe.

+ ) {

+ return true;

+ }

+ return false;

template <typename CHAR, typename UCHAR>

bool DoCanonicalizeMailtoURL(const URLComponentSource<CHAR>& source,

const Parsed& parsed,

@@ -38,12 +55,12 @@ bool DoCanonicalizeMailtoURL(const URLComponentSource<CHAR>& source,

new_parsed->path.begin = output->length();

// Copy the path using path URL's more lax escaping rules.

- // We convert to UTF-8 and escape non-ASCII, but leave all

+ // We convert to UTF-8 and escape non-ASCII, but leave most

// ASCII characters alone.

int end = parsed.path.end();

for (int i = parsed.path.begin; i < end; ++i) {

UCHAR uch = static_cast<UCHAR>(source.path[i]);

- if (uch < 0x20 || uch >= 0x80)

+ if (ShouldEncodeMailboxCharacter<UCHAR>(uch))

success &= AppendUTF8EscapedChar(source.path, &i, end, output);

else

output->push_back(static_cast<char>(uch));

« no previous file with comments | « third_party/WebKit/LayoutTests/fast/url/script-tests/mailto.js ('k') | url/url_canon_unittest.cc » ('j') | no next file with comments »