AK: Do not trim away non-ASCII bytes when parsing URL

Because the bytes that encode non-ASCII code points have negative values when `char` is signed, trimming away control characters requires checking for negative byte values. This also adds a test case with a URL containing non-ASCII code points.
2025-09-16 19:26:17 +00:00 · 2021-06-03 12:36:02 +02:00 · 2021-06-03 12:36:02 +02:00 · 99d5555134
commit 99d5555134
parent 44937e2dfc
2 changed files with 11 additions and 2 deletions
--- a/Tests/AK/TestURL.cpp
+++ b/Tests/AK/TestURL.cpp
@@ -328,3 +328,12 @@ TEST_CASE(leading_and_trailing_whitespace)
    EXPECT(url.is_valid());
    EXPECT_EQ(url.to_string(), "https://foo.com/");
 }
+
+TEST_CASE(unicode) // Checks that a URL whose path contains non-ASCII code points parses intact.
+{
+    URL url { "http://example.com/_ünicöde_téxt_©" }; // Input ends in a non-ASCII code point and has no '?' or '#'.
+    EXPECT(url.is_valid());
+    EXPECT_EQ(url.path(), "/_ünicöde_téxt_©"); // Path must match the input verbatim, including the trailing '©'.
+    EXPECT(url.query().is_null()); // The input has no '?', so no query is expected.
+    EXPECT(url.fragment().is_null()); // The input has no '#', so no fragment is expected.
+}