1
Fork 0
mirror of https://github.com/RGBCube/serenity synced 2025-05-31 10:58:12 +00:00

LibWebView: Protect URL highlighting against partially-typed URLs

The current helpers assume that a valid URL is a full URL (i.e. contains
the "://" separator between the scheme and domain). This isn't true, as
"file:" alone is parsed as a valid URL.

We must also avoid simply searching for the parsed public suffix in the
original URL string. For example, "com" is a public suffix. If we search
for that in the URL "com.com", we will think the public suffix starts at
index 0.
This commit is contained in:
Timothy Flynn 2023-10-28 09:31:24 -04:00 committed by Andreas Kling
parent 194bf5a677
commit 8dc25dffc2
5 changed files with 113 additions and 15 deletions

View file

@ -107,27 +107,35 @@ static URLParts break_file_url_into_parts(URL const& url, StringView url_string)
// Breaks a web URL string into the pieces returned as URLParts: a leading view
// (scheme plus any subdomain labels), the domain view, and the remainder.
//
// NOTE(review): this listing looks like a rendered diff with the +/- markers
// stripped, so superseded and replacement statements are interleaved.
// `public_suffix`, `remainder` and `scheme_and_subdomain` are each declared
// twice and there are two unconditional returns at the end, so the block cannot
// compile as shown. The "presumably superseded" notes below are a best guess
// from the data flow; confirm against the real file.
static URLParts break_web_url_into_parts(URL const& url, StringView url_string)
{
// Presumably superseded: serialized host, only consumed by the get_public_suffix(host) lookup below.
auto host = MUST(url.serialized_host());
// View over the scheme text plus the "://" separator at the start of url_string.
auto scheme = url_string.substring_view(0, url.scheme().bytes_as_string_view().length() + "://"sv.length());
// Everything in url_string after the "://" separator.
auto url_without_scheme = url_string.substring_view(scheme.length());
// Presumably superseded: suffix lookup on the host, returning empty URLParts when there is none.
auto public_suffix = get_public_suffix(host);
if (!public_suffix.has_value())
return {};
StringView domain;
StringView remainder;
// Presumably superseded: finds the first occurrence of the suffix text anywhere in
// the whole URL string, and calls .value() on the result without a has_value() check.
auto public_suffix_start = url_string.find(*public_suffix);
auto public_suffix_end = public_suffix_start.value() + public_suffix->bytes_as_string_view().length();
// Split at the first '/', '?' or '#': the text before it is the domain and the
// rest (delimiter included) is the remainder. Without a delimiter the whole
// string is the domain and remainder keeps its default-constructed value.
if (auto index = url_without_scheme.find_any_of("/?#"sv); index.has_value()) {
domain = url_without_scheme.substring_view(0, *index);
remainder = url_without_scheme.substring_view(*index);
} else {
domain = url_without_scheme;
}
// Presumably superseded: everything before the located suffix, minus trailing dots.
auto scheme_and_subdomain = url_string.substring_view(0, *public_suffix_start);
scheme_and_subdomain = scheme_and_subdomain.trim("."sv, TrimMode::Right);
// Look up the public suffix from the domain text as typed. If there is none, or
// the domain does not end with it, return the pieces without splitting off a subdomain.
auto public_suffix = get_public_suffix(domain);
if (!public_suffix.has_value() || !domain.ends_with(*public_suffix))
return { scheme, domain, remainder };
// Presumably superseded: cut just after the last '.', or fall back to scheme + "://" when no '.' is found.
if (auto index = scheme_and_subdomain.find_last('.'); index.has_value())
scheme_and_subdomain = scheme_and_subdomain.substring_view(0, *index + 1);
else
scheme_and_subdomain = scheme_and_subdomain.substring_view(0, url.scheme().bytes_as_string_view().length() + "://"sv.length());
// Drop the public suffix from the end of the domain, then any trailing '.' left
// in front of it.
auto subdomain = domain.substring_view(0, domain.length() - public_suffix->bytes_as_string_view().length());
subdomain = subdomain.trim("."sv, TrimMode::Right);
// Presumably superseded: slices computed from the offsets found by the whole-string search.
auto effective_tld_plus_one = url_string.substring_view(scheme_and_subdomain.length(), public_suffix_end - scheme_and_subdomain.length());
auto remainder = url_string.substring_view(public_suffix_end);
// If a '.' is still present, everything up to and including the last one is the
// subdomain and `domain` is narrowed to what follows it; otherwise there is no
// subdomain.
if (auto index = subdomain.find_last('.'); index.has_value()) {
subdomain = subdomain.substring_view(0, *index + 1);
domain = domain.substring_view(subdomain.length());
} else {
subdomain = {};
}
// Presumably superseded return.
return URLParts { scheme_and_subdomain, effective_tld_plus_one, remainder };
// scheme and subdomain both start from the front of url_string and are adjacent,
// so one view of their combined length covers both.
auto scheme_and_subdomain = url_string.substring_view(0, scheme.length() + subdomain.length());
return { scheme_and_subdomain, domain, remainder };
}
Optional<URLParts> break_url_into_parts(StringView url_string)
@ -136,6 +144,10 @@ Optional<URLParts> break_url_into_parts(StringView url_string)
if (!url.is_valid())
return {};
auto scheme_length = url.scheme().bytes_as_string_view().length();
if (!url_string.substring_view(scheme_length).starts_with("://"sv))
return {};
if (url.scheme() == "file"sv)
return break_file_url_into_parts(url, url_string);
if (url.scheme().is_one_of("http"sv, "https"sv, "gemini"sv))