Avi Drissman | 4e1b7bc3 | 2022-09-15 14:03:50 | [diff] [blame] | 1 | // Copyright 2017 The Chromium Authors |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 2 | // Use of this source code is governed by a BSD-style license that can be |
| 3 | // found in the LICENSE file. |
| 4 | |
| 5 | #include "content/browser/isolated_origin_util.h" |
| 6 | |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 7 | #include <string> |
| 8 | #include <string_view> |
| 9 | |
Hans Wennborg | f95d569 | 2020-04-22 17:43:31 | [diff] [blame] | 10 | #include "base/logging.h" |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 11 | #include "base/strings/string_util.h" |
| 12 | #include "net/base/registry_controlled_domains/registry_controlled_domain.h" |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 13 | #include "services/network/public/cpp/is_potentially_trustworthy.h" |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 14 | #include "url/gurl.h" |
| 15 | |
// Marker that may directly follow the scheme separator in an isolated origin
// pattern (e.g. "https://[*.]foo.com"). IsolatedOriginPattern::Parse() strips
// it from the host and records that all subdomains are to be isolated.
const char* kAllSubdomainsWildcard = "[*.]";
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 17 | |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 18 | namespace content { |
| 19 | |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 20 | IsolatedOriginPattern::IsolatedOriginPattern(std::string_view pattern) |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 21 | : isolate_all_subdomains_(false), is_valid_(false) { |
| 22 | Parse(pattern); |
| 23 | } |
| 24 | |
| 25 | IsolatedOriginPattern::IsolatedOriginPattern(const url::Origin& origin) |
| 26 | : IsolatedOriginPattern(origin.GetURL().spec()) {} |
| 27 | |
| 28 | IsolatedOriginPattern::~IsolatedOriginPattern() = default; |
| 29 | IsolatedOriginPattern::IsolatedOriginPattern( |
| 30 | const IsolatedOriginPattern& other) = default; |
| 31 | IsolatedOriginPattern& IsolatedOriginPattern::operator=( |
| 32 | const IsolatedOriginPattern& other) = default; |
| 33 | IsolatedOriginPattern::IsolatedOriginPattern(IsolatedOriginPattern&& other) = |
| 34 | default; |
| 35 | IsolatedOriginPattern& IsolatedOriginPattern::operator=( |
| 36 | IsolatedOriginPattern&& other) = default; |
| 37 | |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 38 | bool IsolatedOriginPattern::Parse(const std::string_view& unparsed_pattern) { |
Peter Kasting | b53b8191 | 2021-04-28 19:23:30 | [diff] [blame] | 39 | pattern_ = std::string(unparsed_pattern); |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 40 | origin_ = url::Origin(); |
| 41 | isolate_all_subdomains_ = false; |
| 42 | is_valid_ = false; |
| 43 | |
| 44 | size_t host_begin = unparsed_pattern.find(url::kStandardSchemeSeparator); |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 45 | if (host_begin == std::string_view::npos || host_begin == 0) { |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 46 | return false; |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 47 | } |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 48 | |
| 49 | // Skip over the scheme separator. |
| 50 | host_begin += strlen(url::kStandardSchemeSeparator); |
| 51 | if (host_begin >= unparsed_pattern.size()) |
| 52 | return false; |
| 53 | |
Md Hasibul Hasan | a963a934 | 2024-04-03 10:15:14 | [diff] [blame] | 54 | std::string_view scheme_part = unparsed_pattern.substr(0, host_begin); |
| 55 | std::string_view host_part = unparsed_pattern.substr(host_begin); |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 56 | |
| 57 | // Empty schemes or hosts are invalid for isolation purposes. |
| 58 | if (host_part.size() == 0) |
| 59 | return false; |
| 60 | |
Jan Wilken Dörrie | f05bb10 | 2020-08-18 19:35:56 | [diff] [blame] | 61 | if (base::StartsWith(host_part, kAllSubdomainsWildcard)) { |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 62 | isolate_all_subdomains_ = true; |
| 63 | host_part.remove_prefix(strlen(kAllSubdomainsWildcard)); |
| 64 | } |
| 65 | |
| 66 | GURL conformant_url(base::JoinString({scheme_part, host_part}, "")); |
| 67 | origin_ = url::Origin::Create(conformant_url); |
| 68 | |
| 69 | // Ports are ignored when matching isolated origins (see also |
| 70 | // https://crbug.com/914511). |
| 71 | const std::string& scheme = origin_.scheme(); |
Scott Violet | a02c94b14 | 2024-08-28 03:29:18 | [diff] [blame] | 72 | int default_port = url::DefaultPortForScheme(scheme); |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 73 | if (origin_.port() != default_port) { |
| 74 | LOG(ERROR) << "Ignoring port number in isolated origin: " << origin_; |
| 75 | origin_ = url::Origin::Create(GURL( |
| 76 | origin_.scheme() + url::kStandardSchemeSeparator + origin_.host())); |
| 77 | } |
| 78 | |
| 79 | // Can't isolate subdomains of an IP address, must be a valid isolated origin |
| 80 | // after processing. |
| 81 | if ((conformant_url.HostIsIPAddress() && isolate_all_subdomains_) || |
| 82 | !IsolatedOriginUtil::IsValidIsolatedOrigin(origin_)) { |
| 83 | origin_ = url::Origin(); |
| 84 | isolate_all_subdomains_ = false; |
| 85 | return false; |
| 86 | } |
| 87 | |
Andrew Stone | 0a177fe2 | 2019-06-26 08:12:04 | [diff] [blame] | 88 | DCHECK(!is_valid_ || !origin_.opaque()); |
Andrew Stone | 6ed99b2 | 2019-06-07 06:14:39 | [diff] [blame] | 89 | is_valid_ = true; |
| 90 | return true; |
| 91 | } |
| 92 | |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 93 | // static |
| 94 | bool IsolatedOriginUtil::DoesOriginMatchIsolatedOrigin( |
| 95 | const url::Origin& origin, |
| 96 | const url::Origin& isolated_origin) { |
| 97 | // Don't match subdomains if the isolated origin is an IP address. |
| 98 | if (isolated_origin.GetURL().HostIsIPAddress()) |
| 99 | return origin == isolated_origin; |
| 100 | |
Lukasz Anforowicz | 2542093 | 2018-12-18 20:59:22 | [diff] [blame] | 101 | // Compare scheme and hostname, but don't compare ports - see |
| 102 | // https://crbug.com/914511. |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 103 | if (origin.scheme() != isolated_origin.scheme()) |
| 104 | return false; |
| 105 | |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 106 | // Subdomains of an isolated origin are considered to be in the same isolated |
| 107 | // origin. |
| 108 | return origin.DomainIs(isolated_origin.host()); |
| 109 | } |
| 110 | |
| 111 | // static |
| 112 | bool IsolatedOriginUtil::IsValidIsolatedOrigin(const url::Origin& origin) { |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 113 | return IsValidIsolatedOriginImpl(origin, |
| 114 | /* is_legacy_isolated_origin_check=*/true); |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 115 | } |
| 116 | |
| 117 | // static |
| 118 | bool IsolatedOriginUtil::IsValidOriginForOptInIsolation( |
| 119 | const url::Origin& origin) { |
| 120 | // Per https://html.spec.whatwg.org/C/#initialise-the-document-object, |
| 121 | // non-secure contexts cannot be isolated via opt-in origin isolation. |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 122 | return IsValidIsolatedOriginImpl( |
| 123 | origin, /* is_legacy_isolated_origin_check=*/false) && |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 124 | network::IsOriginPotentiallyTrustworthy(origin); |
| 125 | } |
| 126 | |
| 127 | // static |
W. James MacLean | c07dc41b | 2022-07-25 18:52:16 | [diff] [blame] | 128 | bool IsolatedOriginUtil::IsValidOriginForOptOutIsolation( |
| 129 | const url::Origin& origin) { |
| 130 | // Per https://html.spec.whatwg.org/C/#initialise-the-document-object, |
| 131 | // non-secure contexts cannot be isolated via opt-in origin isolation, |
| 132 | // but we allow non-secure contexts to opt-out for legacy sites. |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 133 | return IsValidIsolatedOriginImpl(origin, |
| 134 | /* is_legacy_isolated_origin_check=*/false); |
W. James MacLean | c07dc41b | 2022-07-25 18:52:16 | [diff] [blame] | 135 | } |
| 136 | |
| 137 | // static |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 138 | bool IsolatedOriginUtil::IsValidIsolatedOriginImpl( |
| 139 | const url::Origin& origin, |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 140 | bool is_legacy_isolated_origin_check) { |
Chris Palmer | ab5e5b5 | 2018-09-28 19:19:30 | [diff] [blame] | 141 | if (origin.opaque()) |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 142 | return false; |
| 143 | |
| 144 | // Isolated origins should have HTTP or HTTPS schemes. Hosts in other |
| 145 | // schemes may not be compatible with subdomain matching. |
| 146 | GURL origin_gurl = origin.GetURL(); |
| 147 | if (!origin_gurl.SchemeIsHTTPOrHTTPS()) |
| 148 | return false; |
| 149 | |
| 150 | // IP addresses are allowed. |
| 151 | if (origin_gurl.HostIsIPAddress()) |
| 152 | return true; |
| 153 | |
| 154 | // Disallow hosts such as http://co.uk/, which don't have a valid |
| 155 | // registry-controlled domain. This prevents subdomain matching from |
| 156 | // grouping unrelated sites on a registry into the same origin. |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 157 | // |
| 158 | // This is not relevant for opt-in origin isolation, which doesn't need to |
| 159 | // match subdomains. (And it'd be bad to check this in that case, as it |
| 160 | // prohibits http://localhost/; see https://crbug.com/1142894.) |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 161 | if (is_legacy_isolated_origin_check) { |
Domenic Denicola | 4d1145d | 2020-10-29 15:05:33 | [diff] [blame] | 162 | const bool has_registry_domain = |
| 163 | net::registry_controlled_domains::HostHasRegistryControlledDomain( |
| 164 | origin.host(), |
| 165 | net::registry_controlled_domains::INCLUDE_UNKNOWN_REGISTRIES, |
| 166 | net::registry_controlled_domains::INCLUDE_PRIVATE_REGISTRIES); |
| 167 | if (!has_registry_domain) |
| 168 | return false; |
| 169 | } |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 170 | |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 171 | // Disallow hosts with a trailing dot for legacy isolated origins, but allow |
| 172 | // them for opt-in origin isolation since the spec says that they represent |
| 173 | // a distinct origin: https://url.spec.whatwg.org/#concept-domain. |
| 174 | // TODO(alexmos): Legacy isolated origins should probably support trailing |
| 175 | // dots as well, but enabling this would require carefully thinking about |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 176 | // whether hosts without a trailing dot should match it. |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 177 | if (is_legacy_isolated_origin_check && origin.host().back() == '.') { |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 178 | return false; |
W. James MacLean | d8d31f0f | 2023-05-26 19:15:57 | [diff] [blame] | 179 | } |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 180 | |
| 181 | return true; |
| 182 | } |
| 183 | |
alexmos | 4bc2632 | 2017-07-01 00:57:14 | [diff] [blame] | 184 | } // namespace content |