OLD | NEW |
1 // Copyright 2015 The Chromium Authors. All rights reserved. | 1 // Copyright 2015 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "net/cert/internal/verify_name_match.h" | 5 #include "net/cert/internal/verify_name_match.h" |
| 6 |
| 7 #include <string.h> |
| 8 |
| 9 #include "base/stl_util.h" |
| 10 #include "base/strings/string16.h" |
| 11 #include "base/strings/string_util.h" |
| 12 #include "base/strings/utf_string_conversion_utils.h" |
| 13 #include "base/strings/utf_string_conversions.h" |
| 14 #include "base/sys_byteorder.h" |
| 15 #include "base/third_party/icu/icu_utf.h" |
| 16 #include "base/tuple.h" |
6 #include "net/der/input.h" | 17 #include "net/der/input.h" |
| 18 #include "net/der/parser.h" |
| 19 #include "net/der/tag.h" |
7 | 20 |
8 namespace net { | 21 namespace net { |
9 | 22 |
| 23 namespace { |
| 24 |
| 25 // Types of character set checking that NormalizeDirectoryString can perform. |
| 26 enum CharsetEnforcement { |
| 27 NO_ENFORCEMENT, |
| 28 ENFORCE_PRINTABLE_STRING, |
| 29 ENFORCE_ASCII, |
| 30 }; |
| 31 |
| 32 // Normalizes |output|, a UTF-8 encoded string, as if it contained |
| 33 // only ASCII characters. |
| 34 // |
| 35 // This could be considered a partial subset of RFC 5280 rules, and |
| 36 // is compatible with RFC 2459/3280. |
| 37 // |
| 38 // In particular, RFC 5280, Section 7.1 describes how UTF8String |
| 39 // and PrintableString should be compared - using the LDAP StringPrep |
| 40 // profile of RFC 4518, with case folding and whitespace compression. |
| 41 // However, because it is optional for 2459/3280 implementations and because |
| 42 // it's desirable to avoid the size cost of the StringPrep tables, |
| 43 // this function treats |output| as if it was composed of ASCII. |
| 44 // |
| 45 // That is, rather than folding all whitespace characters, it only |
| 46 // folds ' '. Rather than case folding using locale-aware handling, |
| 47 // it only folds A-Z to a-z. |
| 48 // |
| 49 // This gives better results than outright rejecting (due to mismatched |
| 50 // encodings), or from doing a strict binary comparison (the minimum |
| 51 // required by RFC 3280), and is sufficient for those certificates |
| 52 // publicly deployed. |
| 53 // |
| 54 // If |charset_enforcement| is not NO_ENFORCEMENT and |output| contains any |
| 55 // characters not allowed in the specified charset, returns false. |
| 56 // |
| 57 // NOTE: |output| will be modified regardless of the return. |
| 58 WARN_UNUSED_RESULT bool NormalizeDirectoryString( |
| 59 CharsetEnforcement charset_enforcement, |
| 60 std::string* output) { |
| 61 // Normalized version will always be equal or shorter than input. |
| 62 // Normalize in place and then truncate the output if necessary. |
| 63 std::string::const_iterator read_iter = output->begin(); |
| 64 std::string::iterator write_iter = output->begin(); |
| 65 |
| 66 for (; read_iter != output->end() && *read_iter == ' '; ++read_iter) { |
| 67 // Ignore leading whitespace. |
| 68 } |
| 69 |
| 70 for (; read_iter != output->end(); ++read_iter) { |
| 71 const unsigned char c = *read_iter; |
| 72 if (c == ' ') { |
| 73 // If there are non-whitespace characters remaining in input, compress |
| 74 // multiple whitespace chars to a single space, otherwise ignore trailing |
| 75 // whitespace. |
| 76 std::string::const_iterator next_iter = read_iter + 1; |
| 77 if (next_iter != output->end() && *next_iter != ' ') |
| 78 *(write_iter++) = ' '; |
| 79 } else if (c >= 'A' && c <= 'Z') { |
| 80 // Fold case. |
| 81 *(write_iter++) = c + ('a' - 'A'); |
| 82 } else { |
| 83 // Note that these checks depend on the characters allowed by earlier |
| 84 // conditions also being valid for the enforced charset. |
| 85 switch (charset_enforcement) { |
| 86 case ENFORCE_PRINTABLE_STRING: |
| 87 // See NormalizePrintableStringValue comment for the acceptable list |
| 88 // of characters. |
| 89 if (!((c >= 'a' && c <= 'z') || (c >= '\'' && c <= ':') || c == '=' || |
| 90 c == '?')) |
| 91 return false; |
| 92 break; |
| 93 case ENFORCE_ASCII: |
| 94 if (c > 0x7F) |
| 95 return false; |
| 96 break; |
| 97 case NO_ENFORCEMENT: |
| 98 break; |
| 99 } |
| 100 *(write_iter++) = c; |
| 101 } |
| 102 } |
| 103 if (write_iter != output->end()) |
| 104 output->erase(write_iter, output->end()); |
| 105 return true; |
| 106 } |
| 107 |
| 108 // Normalizes the DER-encoded PrintableString value |in| according to |
| 109 // RFC 2459, Section 4.1.2.4 |
| 110 // |
| 111 // Briefly, normalization involves removing leading and trailing |
| 112 // whitespace, folding multiple whitespace characters into a single |
| 113 // whitespace character, and normalizing on case (this function |
| 114 // normalizes to lowercase). |
| 115 // |
| 116 // During normalization, this function also validates that |in| |
| 117 // is properly encoded - that is, that it restricts to the character |
| 118 // set defined in X.680 (2008), Section 41.4, Table 10. X.680 defines |
| 119 // the valid characters as |
| 120 // a-z A-Z 0-9 (space) ' ( ) + , - . / : = ? |
| 121 // |
| 122 // However, due to an old OpenSSL encoding bug, a number of |
| 123 // certificates have also included '*', which has historically been |
| 124 // allowed by implementations, and so is also allowed here. |
| 125 // |
| 126 // If |in| can be normalized, returns true and sets |output| to the |
| 127 // case folded, normalized value. If |in| is invalid, returns false. |
| 128 // NOTE: |output| will be modified regardless of the return. |
| 129 WARN_UNUSED_RESULT bool NormalizePrintableStringValue(const der::Input& in, |
| 130 std::string* output) { |
| 131 output->assign(in.AsString()); |
| 132 return NormalizeDirectoryString(ENFORCE_PRINTABLE_STRING, output); |
| 133 } |
| 134 |
| 135 // Normalized a UTF8String value. See the comment for NormalizeDirectoryString |
| 136 // for details. |
| 137 // |
| 138 // If |in| can be normalized, returns true and sets |output| to the |
| 139 // case folded, normalized value. If |in| is invalid, returns false. |
| 140 // NOTE: |output| will be modified regardless of the return. |
| 141 WARN_UNUSED_RESULT bool NormalizeUtf8StringValue(const der::Input& in, |
| 142 std::string* output) { |
| 143 output->assign(in.AsString()); |
| 144 return NormalizeDirectoryString(NO_ENFORCEMENT, output); |
| 145 } |
| 146 |
| 147 // IA5String is ISO/IEC Registrations 1 and 6 from the ISO |
| 148 // "International Register of Coded Character Sets to be used |
| 149 // with Escape Sequences", plus space and delete. That's just the |
| 150 // polite way of saying 0x00 - 0x7F, aka ASCII (or, more formally, |
| 151 // ISO/IEC 646) |
| 152 // |
| 153 // If |in| can be normalized, returns true and sets |output| to the case folded, |
| 154 // normalized value. If |in| is invalid, returns false. |
| 155 // NOTE: |output| will be modified regardless of the return. |
| 156 WARN_UNUSED_RESULT bool NormalizeIA5StringValue(const der::Input& in, |
| 157 std::string* output) { |
| 158 output->assign(in.AsString()); |
| 159 return NormalizeDirectoryString(ENFORCE_ASCII, output); |
| 160 } |
| 161 |
| 162 // Converts BMPString value to UTF-8 and then normalizes it. See the comment for |
| 163 // NormalizeDirectoryString for details. |
| 164 // |
| 165 // If |in| can be normalized, returns true and sets |output| to the case folded, |
| 166 // normalized value. If |in| is invalid, returns false. |
| 167 // NOTE: |output| will be modified regardless of the return. |
| 168 WARN_UNUSED_RESULT bool NormalizeBmpStringValue(const der::Input& in, |
| 169 std::string* output) { |
| 170 if (in.Length() % 2 != 0) |
| 171 return false; |
| 172 |
| 173 base::string16 in_16bit; |
| 174 if (in.Length()) { |
| 175 memcpy(base::WriteInto(&in_16bit, in.Length() / 2 + 1), in.UnsafeData(), |
| 176 in.Length()); |
| 177 } |
| 178 for (base::char16& c : in_16bit) { |
| 179 // BMPString is UCS-2 in big-endian order. |
| 180 c = base::NetToHost16(c); |
| 181 |
| 182 // BMPString only supports codepoints in the Basic Multilingual Plane; |
| 183 // surrogates are not allowed. |
| 184 if (CBU_IS_SURROGATE(c)) |
| 185 return false; |
| 186 } |
| 187 if (!base::UTF16ToUTF8(in_16bit.data(), in_16bit.size(), output)) |
| 188 return false; |
| 189 return NormalizeDirectoryString(NO_ENFORCEMENT, output); |
| 190 } |
| 191 |
| 192 // Converts UniversalString value to UTF-8 and then normalizes it. See the |
| 193 // comment for NormalizeDirectoryString for details. |
| 194 // |
| 195 // If |in| can be normalized, returns true and sets |output| to the case folded, |
| 196 // normalized value. If |in| is invalid, returns false. |
| 197 // NOTE: |output| will be modified regardless of the return. |
| 198 WARN_UNUSED_RESULT bool NormalizeUniversalStringValue(const der::Input& in, |
| 199 std::string* output) { |
| 200 if (in.Length() % 4 != 0) |
| 201 return false; |
| 202 |
| 203 std::vector<uint32_t> in_32bit(in.Length() / 4); |
| 204 if (in.Length()) |
| 205 memcpy(vector_as_array(&in_32bit), in.UnsafeData(), in.Length()); |
| 206 for (const uint32_t c : in_32bit) { |
| 207 // UniversalString is UCS-4 in big-endian order. |
| 208 uint32_t codepoint = base::NetToHost32(c); |
| 209 if (!CBU_IS_UNICODE_CHAR(codepoint)) |
| 210 return false; |
| 211 |
| 212 base::WriteUnicodeCharacter(codepoint, output); |
| 213 } |
| 214 return NormalizeDirectoryString(NO_ENFORCEMENT, output); |
| 215 } |
| 216 |
| 217 // Converts the string |value| to UTF-8, normalizes it, and stores in |output|. |
| 218 // |tag| must one of the types for which IsNormalizableDirectoryString is true. |
| 219 // |
| 220 // If |value| can be normalized, returns true and sets |output| to the case |
| 221 // folded, normalized value. If |value| is invalid, returns false. |
| 222 // NOTE: |output| will be modified regardless of the return. |
| 223 WARN_UNUSED_RESULT bool NormalizeValue(const der::Tag tag, |
| 224 const der::Input& value, |
| 225 std::string* output) { |
| 226 switch (tag) { |
| 227 case der::kPrintableString: |
| 228 return NormalizePrintableStringValue(value, output); |
| 229 case der::kUtf8String: |
| 230 return NormalizeUtf8StringValue(value, output); |
| 231 case der::kIA5String: |
| 232 return NormalizeIA5StringValue(value, output); |
| 233 case der::kUniversalString: |
| 234 return NormalizeUniversalStringValue(value, output); |
| 235 case der::kBmpString: |
| 236 return NormalizeBmpStringValue(value, output); |
| 237 default: |
| 238 NOTREACHED(); |
| 239 return false; |
| 240 } |
| 241 } |
| 242 |
| 243 // Returns true if |tag| is a string type that NormalizeValue can handle. |
| 244 bool IsNormalizableDirectoryString(der::Tag tag) { |
| 245 switch (tag) { |
| 246 case der::kPrintableString: |
| 247 case der::kUtf8String: |
| 248 // RFC 5280 only requires handling IA5String for comparing domainComponent |
| 249 // values, but handling it here avoids the need to special case anything. |
| 250 case der::kIA5String: |
| 251 case der::kUniversalString: |
| 252 case der::kBmpString: |
| 253 return true; |
| 254 // TeletexString isn't normalized. Section 8 of RFC 5280 briefly |
| 255 // describes the historical confusion between treating TeletexString |
| 256 // as Latin1String vs T.61, and there are even incompatibilities within |
| 257 // T.61 implementations. As this time is virtually unused, simply |
| 258 // treat it with a binary comparison, as permitted by RFC 3280/5280. |
| 259 default: |
| 260 return false; |
| 261 } |
| 262 } |
| 263 |
| 264 // Returns true if the AttributeValue (|a_tag|, |a_value|) matches (|b_tag|, |
| 265 // |b_value|). |
| 266 bool VerifyValueMatch(const der::Tag a_tag, |
| 267 const der::Input& a_value, |
| 268 const der::Tag b_tag, |
| 269 const der::Input& b_value) { |
| 270 if (IsNormalizableDirectoryString(a_tag) && |
| 271 IsNormalizableDirectoryString(b_tag)) { |
| 272 std::string a_normalized, b_normalized; |
| 273 if (!NormalizeValue(a_tag, a_value, &a_normalized) || |
| 274 !NormalizeValue(b_tag, b_value, &b_normalized)) |
| 275 return false; |
| 276 return a_normalized == b_normalized; |
| 277 } |
| 278 // Attributes encoded with different types may be assumed to be unequal. |
| 279 if (a_tag != b_tag) |
| 280 return false; |
| 281 // All other types use binary comparison. |
| 282 return a_value.Equals(b_value); |
| 283 } |
| 284 |
| 285 struct AttributeTypeAndValue { |
| 286 AttributeTypeAndValue(der::Input in_type, |
| 287 der::Tag in_value_tag, |
| 288 der::Input in_value) |
| 289 : type(in_type), value_tag(in_value_tag), value(in_value) {} |
| 290 der::Input type; |
| 291 der::Tag value_tag; |
| 292 der::Input value; |
| 293 }; |
| 294 |
| 295 // Parses all the ASN.1 AttributeTypeAndValue elements in |parser| and stores |
| 296 // each as an AttributeTypeAndValue object in |out|. |
| 297 // |
| 298 // AttributeTypeAndValue is defined in RFC 5280 section 4.1.2.4: |
| 299 // |
| 300 // AttributeTypeAndValue ::= SEQUENCE { |
| 301 // type AttributeType, |
| 302 // value AttributeValue } |
| 303 // |
| 304 // AttributeType ::= OBJECT IDENTIFIER |
| 305 // |
| 306 // AttributeValue ::= ANY -- DEFINED BY AttributeType |
| 307 // |
| 308 // DirectoryString ::= CHOICE { |
| 309 // teletexString TeletexString (SIZE (1..MAX)), |
| 310 // printableString PrintableString (SIZE (1..MAX)), |
| 311 // universalString UniversalString (SIZE (1..MAX)), |
| 312 // utf8String UTF8String (SIZE (1..MAX)), |
| 313 // bmpString BMPString (SIZE (1..MAX)) } |
| 314 // |
| 315 // The type of the component AttributeValue is determined by the AttributeType; |
| 316 // in general it will be a DirectoryString. |
| 317 WARN_UNUSED_RESULT bool ReadRdn(der::Parser* parser, |
| 318 std::vector<AttributeTypeAndValue>* out) { |
| 319 while (parser->HasMore()) { |
| 320 der::Parser attr_type_and_value; |
| 321 if (!parser->ReadSequence(&attr_type_and_value)) |
| 322 return false; |
| 323 // Read the attribute type, which must be an OBJECT IDENTIFIER. |
| 324 der::Input type; |
| 325 if (!attr_type_and_value.ReadTag(der::kOid, &type)) |
| 326 return false; |
| 327 |
| 328 // Read the attribute value. |
| 329 der::Tag tag; |
| 330 der::Input value; |
| 331 if (!attr_type_and_value.ReadTagAndValue(&tag, &value)) |
| 332 return false; |
| 333 |
| 334 // There should be no more elements in the sequence after reading the |
| 335 // attribute type and value. |
| 336 if (attr_type_and_value.HasMore()) |
| 337 return false; |
| 338 |
| 339 out->push_back(AttributeTypeAndValue(type, tag, value)); |
| 340 } |
| 341 return true; |
| 342 } |
| 343 |
| 344 // Verifies that |a_parser| and |b_parser| are the same length and that every |
| 345 // AttributeTypeAndValue in |a_parser| has a matching AttributeTypeAndValue in |
| 346 // |b_parser|. |
| 347 bool VerifyRdnMatch(der::Parser* a_parser, der::Parser* b_parser) { |
| 348 std::vector<AttributeTypeAndValue> a_type_and_values, b_type_and_values; |
| 349 if (!ReadRdn(a_parser, &a_type_and_values) || |
| 350 !ReadRdn(b_parser, &b_type_and_values)) |
| 351 return false; |
| 352 |
| 353 // RFC 5280 section 4.1.2.4 |
| 354 // RelativeDistinguishedName ::= SET SIZE (1..MAX) OF AttributeTypeAndValue |
| 355 if (a_type_and_values.empty() || b_type_and_values.empty()) |
| 356 return false; |
| 357 |
| 358 // RFC 5280 section 7.1: |
| 359 // Two relative distinguished names RDN1 and RDN2 match if they have the same |
| 360 // number of naming attributes and for each naming attribute in RDN1 there is |
| 361 // a matching naming attribute in RDN2. |
| 362 if (a_type_and_values.size() != b_type_and_values.size()) |
| 363 return false; |
| 364 |
| 365 // The ordering of elements may differ due to denormalized values sorting |
| 366 // differently in the DER encoding. Since the number of elements should be |
| 367 // small, a naive linear search for each element should be fine. (Hostile |
| 368 // certificates already have ways to provoke pathological behavior.) |
| 369 for (const auto& a : a_type_and_values) { |
| 370 bool matched = false; |
| 371 for (const auto& b : b_type_and_values) { |
| 372 if (a.type.Equals(b.type) && |
| 373 VerifyValueMatch(a.value_tag, a.value, b.value_tag, b.value)) { |
| 374 matched = true; |
| 375 break; |
| 376 } |
| 377 } |
| 378 if (!matched) |
| 379 return false; |
| 380 } |
| 381 |
| 382 // Every element in |a_type_and_values| had a matching element in |
| 383 // |b_type_and_values|. |
| 384 return true; |
| 385 } |
| 386 |
| 387 } // namespace |
| 388 |
| 389 // |a| and |b| are ASN.1 RDNSequence values (not including the Sequence tag), |
| 390 // defined in RFC 5280 section 4.1.2.4: |
| 391 // |
| 392 // Name ::= CHOICE { -- only one possibility for now -- |
| 393 // rdnSequence RDNSequence } |
| 394 // |
| 395 // RDNSequence ::= SEQUENCE OF RelativeDistinguishedName |
| 396 // |
| 397 // RelativeDistinguishedName ::= |
| 398 // SET SIZE (1..MAX) OF AttributeTypeAndValue |
10 bool VerifyNameMatch(const der::Input& a, const der::Input& b) { | 399 bool VerifyNameMatch(const der::Input& a, const der::Input& b) { |
11 // TODO(mattm): use normalization as specified in RFC 5280 section 7. | 400 // Empty Names are allowed. RFC 5280 section 4.1.2.4 requires "The issuer |
12 return a.Equals(b); | 401 // field MUST contain a non-empty distinguished name (DN)", while section |
| 402 // 4.1.2.6 allows for the Subject to be empty in certain cases. The caller is |
| 403 // assumed to have verified those conditions. |
| 404 |
| 405 // RFC 5280 section 7.1: |
| 406 // Two distinguished names DN1 and DN2 match if they have the same number of |
| 407 // RDNs, for each RDN in DN1 there is a matching RDN in DN2, and the matching |
| 408 // RDNs appear in the same order in both DNs. |
| 409 |
| 410 // First just check if the inputs have the same number of RDNs: |
| 411 der::Parser a_rdn_sequence_counter(a); |
| 412 der::Parser b_rdn_sequence_counter(b); |
| 413 while (a_rdn_sequence_counter.HasMore() && b_rdn_sequence_counter.HasMore()) { |
| 414 if (!a_rdn_sequence_counter.SkipTag(der::kSet) || |
| 415 !b_rdn_sequence_counter.SkipTag(der::kSet)) { |
| 416 return false; |
| 417 } |
| 418 } |
| 419 if (a_rdn_sequence_counter.HasMore() || b_rdn_sequence_counter.HasMore()) |
| 420 return false; |
| 421 |
| 422 // Same number of RDNs, now check if they match. |
| 423 der::Parser a_rdn_sequence(a); |
| 424 der::Parser b_rdn_sequence(b); |
| 425 while (a_rdn_sequence.HasMore() && b_rdn_sequence.HasMore()) { |
| 426 der::Parser a_rdn, b_rdn; |
| 427 if (!a_rdn_sequence.ReadConstructed(der::kSet, &a_rdn) || |
| 428 !b_rdn_sequence.ReadConstructed(der::kSet, &b_rdn)) { |
| 429 return false; |
| 430 } |
| 431 if (!VerifyRdnMatch(&a_rdn, &b_rdn)) |
| 432 return false; |
| 433 } |
| 434 |
| 435 return true; |
13 } | 436 } |
14 | 437 |
15 } // namespace net | 438 } // namespace net |
OLD | NEW |