|  | // Copyright 2015 The Chromium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | #include "net/cert/internal/verify_name_match.h" | 
|  |  | 
|  | #include <string.h> | 
|  |  | 
|  | #include "base/stl_util.h" | 
|  | #include "base/strings/string16.h" | 
|  | #include "base/strings/string_util.h" | 
|  | #include "base/strings/utf_string_conversion_utils.h" | 
|  | #include "base/strings/utf_string_conversions.h" | 
|  | #include "base/sys_byteorder.h" | 
|  | #include "base/third_party/icu/icu_utf.h" | 
|  | #include "base/tuple.h" | 
|  | #include "net/der/input.h" | 
|  | #include "net/der/parser.h" | 
|  | #include "net/der/tag.h" | 
|  |  | 
|  | namespace net { | 
|  |  | 
|  | namespace { | 
|  |  | 
|  | // Types of character set checking that NormalizeDirectoryString can perform. | 
enum CharsetEnforcement {
  // No character set validation is performed; every byte value is accepted.
  NO_ENFORCEMENT,

  // Characters outside the PrintableString set accepted by
  // NormalizeDirectoryString cause normalization to fail.
  ENFORCE_PRINTABLE_STRING,

  // Any byte greater than 0x7F causes normalization to fail.
  ENFORCE_ASCII,
};
|  |  | 
|  | // Normalizes |output|, a UTF-8 encoded string, as if it contained | 
|  | // only ASCII characters. | 
|  | // | 
|  | // This could be considered a partial subset of RFC 5280 rules, and | 
|  | // is compatible with RFC 2459/3280. | 
|  | // | 
|  | // In particular, RFC 5280, Section 7.1 describes how UTF8String | 
|  | // and PrintableString should be compared - using the LDAP StringPrep | 
|  | // profile of RFC 4518, with case folding and whitespace compression. | 
|  | // However, because it is optional for 2459/3280 implementations and because | 
|  | // it's desirable to avoid the size cost of the StringPrep tables, | 
|  | // this function treats |output| as if it was composed of ASCII. | 
|  | // | 
|  | // That is, rather than folding all whitespace characters, it only | 
|  | // folds ' '. Rather than case folding using locale-aware handling, | 
|  | // it only folds A-Z to a-z. | 
|  | // | 
|  | // This gives better results than outright rejecting (due to mismatched | 
|  | // encodings), or from doing a strict binary comparison (the minimum | 
|  | // required by RFC 3280), and is sufficient for those certificates | 
|  | // publicly deployed. | 
|  | // | 
|  | // If |charset_enforcement| is not NO_ENFORCEMENT and |output| contains any | 
|  | // characters not allowed in the specified charset, returns false. | 
|  | // | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeDirectoryString( | 
|  | CharsetEnforcement charset_enforcement, | 
|  | std::string* output) { | 
|  | // Normalized version will always be equal or shorter than input. | 
|  | // Normalize in place and then truncate the output if necessary. | 
|  | std::string::const_iterator read_iter = output->begin(); | 
|  | std::string::iterator write_iter = output->begin(); | 
|  |  | 
|  | for (; read_iter != output->end() && *read_iter == ' '; ++read_iter) { | 
|  | // Ignore leading whitespace. | 
|  | } | 
|  |  | 
|  | for (; read_iter != output->end(); ++read_iter) { | 
|  | const unsigned char c = *read_iter; | 
|  | if (c == ' ') { | 
|  | // If there are non-whitespace characters remaining in input, compress | 
|  | // multiple whitespace chars to a single space, otherwise ignore trailing | 
|  | // whitespace. | 
|  | std::string::const_iterator next_iter = read_iter + 1; | 
|  | if (next_iter != output->end() && *next_iter != ' ') | 
|  | *(write_iter++) = ' '; | 
|  | } else if (c >= 'A' && c <= 'Z') { | 
|  | // Fold case. | 
|  | *(write_iter++) = c + ('a' - 'A'); | 
|  | } else { | 
|  | // Note that these checks depend on the characters allowed by earlier | 
|  | // conditions also being valid for the enforced charset. | 
|  | switch (charset_enforcement) { | 
|  | case ENFORCE_PRINTABLE_STRING: | 
|  | // See NormalizePrintableStringValue comment for the acceptable list | 
|  | // of characters. | 
|  | if (!((c >= 'a' && c <= 'z') || (c >= '\'' && c <= ':') || c == '=' || | 
|  | c == '?')) | 
|  | return false; | 
|  | break; | 
|  | case ENFORCE_ASCII: | 
|  | if (c > 0x7F) | 
|  | return false; | 
|  | break; | 
|  | case NO_ENFORCEMENT: | 
|  | break; | 
|  | } | 
|  | *(write_iter++) = c; | 
|  | } | 
|  | } | 
|  | if (write_iter != output->end()) | 
|  | output->erase(write_iter, output->end()); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | // Normalizes the DER-encoded PrintableString value |in| according to | 
|  | // RFC 2459, Section 4.1.2.4 | 
|  | // | 
|  | // Briefly, normalization involves removing leading and trailing | 
|  | // whitespace, folding multiple whitespace characters into a single | 
|  | // whitespace character, and normalizing on case (this function | 
|  | // normalizes to lowercase). | 
|  | // | 
|  | // During normalization, this function also validates that |in| | 
|  | // is properly encoded - that is, that it restricts to the character | 
|  | // set defined in X.680 (2008), Section 41.4, Table 10. X.680 defines | 
|  | // the valid characters as | 
|  | //   a-z A-Z 0-9 (space) ' ( ) + , - . / : = ? | 
|  | // | 
|  | // However, due to an old OpenSSL encoding bug, a number of | 
|  | // certificates have also included '*', which has historically been | 
|  | // allowed by implementations, and so is also allowed here. | 
|  | // | 
|  | // If |in| can be normalized, returns true and sets |output| to the | 
|  | // case folded, normalized value. If |in| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizePrintableStringValue(const der::Input& in, | 
|  | std::string* output) { | 
|  | in.AsString().swap(*output); | 
|  | return NormalizeDirectoryString(ENFORCE_PRINTABLE_STRING, output); | 
|  | } | 
|  |  | 
// Normalizes a UTF8String value. See the comment for NormalizeDirectoryString
|  | // for details. | 
|  | // | 
|  | // If |in| can be normalized, returns true and sets |output| to the | 
|  | // case folded, normalized value. If |in| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeUtf8StringValue(const der::Input& in, | 
|  | std::string* output) { | 
|  | in.AsString().swap(*output); | 
|  | return NormalizeDirectoryString(NO_ENFORCEMENT, output); | 
|  | } | 
|  |  | 
|  | // IA5String is ISO/IEC Registrations 1 and 6 from the ISO | 
|  | // "International Register of Coded Character Sets to be used | 
|  | // with Escape Sequences", plus space and delete. That's just the | 
|  | // polite way of saying 0x00 - 0x7F, aka ASCII (or, more formally, | 
|  | // ISO/IEC 646) | 
|  | // | 
|  | // If |in| can be normalized, returns true and sets |output| to the case folded, | 
|  | // normalized value. If |in| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeIA5StringValue(const der::Input& in, | 
|  | std::string* output) { | 
|  | in.AsString().swap(*output); | 
|  | return NormalizeDirectoryString(ENFORCE_ASCII, output); | 
|  | } | 
|  |  | 
|  | // Converts BMPString value to UTF-8 and then normalizes it. See the comment for | 
|  | // NormalizeDirectoryString for details. | 
|  | // | 
|  | // If |in| can be normalized, returns true and sets |output| to the case folded, | 
|  | // normalized value. If |in| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeBmpStringValue(const der::Input& in, | 
|  | std::string* output) { | 
|  | if (in.Length() % 2 != 0) | 
|  | return false; | 
|  |  | 
|  | base::string16 in_16bit; | 
|  | if (in.Length()) { | 
|  | memcpy(base::WriteInto(&in_16bit, in.Length() / 2 + 1), in.UnsafeData(), | 
|  | in.Length()); | 
|  | } | 
|  | for (base::char16& c : in_16bit) { | 
|  | // BMPString is UCS-2 in big-endian order. | 
|  | c = base::NetToHost16(c); | 
|  |  | 
|  | // BMPString only supports codepoints in the Basic Multilingual Plane; | 
|  | // surrogates are not allowed. | 
|  | if (CBU_IS_SURROGATE(c)) | 
|  | return false; | 
|  | } | 
|  | if (!base::UTF16ToUTF8(in_16bit.data(), in_16bit.size(), output)) | 
|  | return false; | 
|  | return NormalizeDirectoryString(NO_ENFORCEMENT, output); | 
|  | } | 
|  |  | 
|  | // Converts UniversalString value to UTF-8 and then normalizes it. See the | 
|  | // comment for NormalizeDirectoryString for details. | 
|  | // | 
|  | // If |in| can be normalized, returns true and sets |output| to the case folded, | 
|  | // normalized value. If |in| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeUniversalStringValue(const der::Input& in, | 
|  | std::string* output) { | 
|  | if (in.Length() % 4 != 0) | 
|  | return false; | 
|  |  | 
|  | std::vector<uint32_t> in_32bit(in.Length() / 4); | 
|  | if (in.Length()) | 
|  | memcpy(vector_as_array(&in_32bit), in.UnsafeData(), in.Length()); | 
|  | for (const uint32_t c : in_32bit) { | 
|  | // UniversalString is UCS-4 in big-endian order. | 
|  | uint32_t codepoint = base::NetToHost32(c); | 
|  | if (!CBU_IS_UNICODE_CHAR(codepoint)) | 
|  | return false; | 
|  |  | 
|  | base::WriteUnicodeCharacter(codepoint, output); | 
|  | } | 
|  | return NormalizeDirectoryString(NO_ENFORCEMENT, output); | 
|  | } | 
|  |  | 
|  | // Converts the string |value| to UTF-8, normalizes it, and stores in |output|. | 
// |tag| must be one of the types for which IsNormalizableDirectoryString is true.
|  | // | 
|  | // If |value| can be normalized, returns true and sets |output| to the case | 
|  | // folded, normalized value. If |value| is invalid, returns false. | 
|  | // NOTE: |output| will be modified regardless of the return. | 
|  | WARN_UNUSED_RESULT bool NormalizeValue(const der::Tag tag, | 
|  | const der::Input& value, | 
|  | std::string* output) { | 
|  | switch (tag) { | 
|  | case der::kPrintableString: | 
|  | return NormalizePrintableStringValue(value, output); | 
|  | case der::kUtf8String: | 
|  | return NormalizeUtf8StringValue(value, output); | 
|  | case der::kIA5String: | 
|  | return NormalizeIA5StringValue(value, output); | 
|  | case der::kUniversalString: | 
|  | return NormalizeUniversalStringValue(value, output); | 
|  | case der::kBmpString: | 
|  | return NormalizeBmpStringValue(value, output); | 
|  | default: | 
|  | NOTREACHED(); | 
|  | return false; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Returns true if |tag| is a string type that NormalizeValue can handle. | 
|  | bool IsNormalizableDirectoryString(der::Tag tag) { | 
|  | switch (tag) { | 
|  | case der::kPrintableString: | 
|  | case der::kUtf8String: | 
|  | // RFC 5280 only requires handling IA5String for comparing domainComponent | 
|  | // values, but handling it here avoids the need to special case anything. | 
|  | case der::kIA5String: | 
|  | case der::kUniversalString: | 
|  | case der::kBmpString: | 
|  | return true; | 
|  | // TeletexString isn't normalized. Section 8 of RFC 5280 briefly | 
|  | // describes the historical confusion between treating TeletexString | 
|  | // as Latin1String vs T.61, and there are even incompatibilities within | 
|  | // T.61 implementations. As this time is virtually unused, simply | 
|  | // treat it with a binary comparison, as permitted by RFC 3280/5280. | 
|  | default: | 
|  | return false; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Returns true if the AttributeValue (|a_tag|, |a_value|) matches (|b_tag|, | 
|  | // |b_value|). | 
|  | bool VerifyValueMatch(const der::Tag a_tag, | 
|  | const der::Input& a_value, | 
|  | const der::Tag b_tag, | 
|  | const der::Input& b_value) { | 
|  | if (IsNormalizableDirectoryString(a_tag) && | 
|  | IsNormalizableDirectoryString(b_tag)) { | 
|  | std::string a_normalized, b_normalized; | 
|  | if (!NormalizeValue(a_tag, a_value, &a_normalized) || | 
|  | !NormalizeValue(b_tag, b_value, &b_normalized)) | 
|  | return false; | 
|  | return a_normalized == b_normalized; | 
|  | } | 
|  | // Attributes encoded with different types may be assumed to be unequal. | 
|  | if (a_tag != b_tag) | 
|  | return false; | 
|  | // All other types use binary comparison. | 
|  | return a_value.Equals(b_value); | 
|  | } | 
|  |  | 
|  | struct AttributeTypeAndValue { | 
|  | AttributeTypeAndValue(der::Input in_type, | 
|  | der::Tag in_value_tag, | 
|  | der::Input in_value) | 
|  | : type(in_type), value_tag(in_value_tag), value(in_value) {} | 
|  | der::Input type; | 
|  | der::Tag value_tag; | 
|  | der::Input value; | 
|  | }; | 
|  |  | 
|  | // Parses all the ASN.1 AttributeTypeAndValue elements in |parser| and stores | 
|  | // each as an AttributeTypeAndValue object in |out|. | 
|  | // | 
|  | // AttributeTypeAndValue is defined in RFC 5280 section 4.1.2.4: | 
|  | // | 
|  | // AttributeTypeAndValue ::= SEQUENCE { | 
|  | //   type     AttributeType, | 
|  | //   value    AttributeValue } | 
|  | // | 
|  | // AttributeType ::= OBJECT IDENTIFIER | 
|  | // | 
|  | // AttributeValue ::= ANY -- DEFINED BY AttributeType | 
|  | // | 
|  | // DirectoryString ::= CHOICE { | 
|  | //       teletexString           TeletexString (SIZE (1..MAX)), | 
|  | //       printableString         PrintableString (SIZE (1..MAX)), | 
|  | //       universalString         UniversalString (SIZE (1..MAX)), | 
|  | //       utf8String              UTF8String (SIZE (1..MAX)), | 
|  | //       bmpString               BMPString (SIZE (1..MAX)) } | 
|  | // | 
|  | // The type of the component AttributeValue is determined by the AttributeType; | 
|  | // in general it will be a DirectoryString. | 
|  | WARN_UNUSED_RESULT bool ReadRdn(der::Parser* parser, | 
|  | std::vector<AttributeTypeAndValue>* out) { | 
|  | while (parser->HasMore()) { | 
|  | der::Parser attr_type_and_value; | 
|  | if (!parser->ReadSequence(&attr_type_and_value)) | 
|  | return false; | 
|  | // Read the attribute type, which must be an OBJECT IDENTIFIER. | 
|  | der::Input type; | 
|  | if (!attr_type_and_value.ReadTag(der::kOid, &type)) | 
|  | return false; | 
|  |  | 
|  | // Read the attribute value. | 
|  | der::Tag tag; | 
|  | der::Input value; | 
|  | if (!attr_type_and_value.ReadTagAndValue(&tag, &value)) | 
|  | return false; | 
|  |  | 
|  | // There should be no more elements in the sequence after reading the | 
|  | // attribute type and value. | 
|  | if (attr_type_and_value.HasMore()) | 
|  | return false; | 
|  |  | 
|  | out->push_back(AttributeTypeAndValue(type, tag, value)); | 
|  | } | 
|  | return true; | 
|  | } | 
|  |  | 
|  | // Verifies that |a_parser| and |b_parser| are the same length and that every | 
|  | // AttributeTypeAndValue in |a_parser| has a matching AttributeTypeAndValue in | 
|  | // |b_parser|. | 
|  | bool VerifyRdnMatch(der::Parser* a_parser, der::Parser* b_parser) { | 
|  | std::vector<AttributeTypeAndValue> a_type_and_values, b_type_and_values; | 
|  | if (!ReadRdn(a_parser, &a_type_and_values) || | 
|  | !ReadRdn(b_parser, &b_type_and_values)) | 
|  | return false; | 
|  |  | 
|  | // RFC 5280 section 4.1.2.4 | 
|  | // RelativeDistinguishedName ::= SET SIZE (1..MAX) OF AttributeTypeAndValue | 
|  | if (a_type_and_values.empty() || b_type_and_values.empty()) | 
|  | return false; | 
|  |  | 
|  | // RFC 5280 section 7.1: | 
|  | // Two relative distinguished names RDN1 and RDN2 match if they have the same | 
|  | // number of naming attributes and for each naming attribute in RDN1 there is | 
|  | // a matching naming attribute in RDN2. | 
|  | if (a_type_and_values.size() != b_type_and_values.size()) | 
|  | return false; | 
|  |  | 
|  | // The ordering of elements may differ due to denormalized values sorting | 
|  | // differently in the DER encoding. Since the number of elements should be | 
|  | // small, a naive linear search for each element should be fine. (Hostile | 
|  | // certificates already have ways to provoke pathological behavior.) | 
|  | for (const auto& a : a_type_and_values) { | 
|  | bool matched = false; | 
|  | for (const auto& b : b_type_and_values) { | 
|  | if (a.type.Equals(b.type) && | 
|  | VerifyValueMatch(a.value_tag, a.value, b.value_tag, b.value)) { | 
|  | matched = true; | 
|  | break; | 
|  | } | 
|  | } | 
|  | if (!matched) | 
|  | return false; | 
|  | } | 
|  |  | 
|  | // Every element in |a_type_and_values| had a matching element in | 
|  | // |b_type_and_values|. | 
|  | return true; | 
|  | } | 
|  |  | 
|  | }  // namespace | 
|  |  | 
|  | // |a| and |b| are ASN.1 RDNSequence values (not including the Sequence tag), | 
|  | // defined in RFC 5280 section 4.1.2.4: | 
|  | // | 
|  | // Name ::= CHOICE { -- only one possibility for now -- | 
|  | //   rdnSequence  RDNSequence } | 
|  | // | 
|  | // RDNSequence ::= SEQUENCE OF RelativeDistinguishedName | 
|  | // | 
|  | // RelativeDistinguishedName ::= | 
|  | //   SET SIZE (1..MAX) OF AttributeTypeAndValue | 
|  | bool VerifyNameMatch(const der::Input& a, const der::Input& b) { | 
|  | // Empty Names are allowed.  RFC 5280 section 4.1.2.4 requires "The issuer | 
|  | // field MUST contain a non-empty distinguished name (DN)", while section | 
|  | // 4.1.2.6 allows for the Subject to be empty in certain cases. The caller is | 
|  | // assumed to have verified those conditions. | 
|  |  | 
|  | // RFC 5280 section 7.1: | 
|  | // Two distinguished names DN1 and DN2 match if they have the same number of | 
|  | // RDNs, for each RDN in DN1 there is a matching RDN in DN2, and the matching | 
|  | // RDNs appear in the same order in both DNs. | 
|  |  | 
|  | // First just check if the inputs have the same number of RDNs: | 
|  | der::Parser a_rdn_sequence_counter(a); | 
|  | der::Parser b_rdn_sequence_counter(b); | 
|  | while (a_rdn_sequence_counter.HasMore() && b_rdn_sequence_counter.HasMore()) { | 
|  | if (!a_rdn_sequence_counter.SkipTag(der::kSet) || | 
|  | !b_rdn_sequence_counter.SkipTag(der::kSet)) { | 
|  | return false; | 
|  | } | 
|  | } | 
|  | if (a_rdn_sequence_counter.HasMore() || b_rdn_sequence_counter.HasMore()) | 
|  | return false; | 
|  |  | 
|  | // Same number of RDNs, now check if they match. | 
|  | der::Parser a_rdn_sequence(a); | 
|  | der::Parser b_rdn_sequence(b); | 
|  | while (a_rdn_sequence.HasMore() && b_rdn_sequence.HasMore()) { | 
|  | der::Parser a_rdn, b_rdn; | 
|  | if (!a_rdn_sequence.ReadConstructed(der::kSet, &a_rdn) || | 
|  | !b_rdn_sequence.ReadConstructed(der::kSet, &b_rdn)) { | 
|  | return false; | 
|  | } | 
|  | if (!VerifyRdnMatch(&a_rdn, &b_rdn)) | 
|  | return false; | 
|  | } | 
|  |  | 
|  | return true; | 
|  | } | 
|  |  | 
|  | }  // namespace net |