2020-01-18 03:38:21 -05:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
|
2021-05-23 17:31:16 -04:00
|
|
|
* Copyright (c) 2021, Max Wipfli <mail@maxwipfli.ch>
|
2020-01-18 03:38:21 -05:00
|
|
|
*
|
2021-04-22 04:24:48 -04:00
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2020-01-18 03:38:21 -05:00
|
|
|
*/
|
|
|
|
|
2019-08-10 11:27:56 -04:00
|
|
|
#pragma once
|
|
|
|
|
2019-09-06 09:34:26 -04:00
|
|
|
#include <AK/String.h>
|
2019-08-10 11:27:56 -04:00
|
|
|
#include <AK/StringView.h>
|
2021-11-10 05:05:21 -05:00
|
|
|
#include <AK/Vector.h>
|
2019-08-10 11:27:56 -04:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2021-05-25 15:32:20 -04:00
|
|
|
// NOTE: The member variables cannot contain any percent encoded sequences.
|
|
|
|
// The URL parser automatically decodes those sequences and the serialize() method will re-encode them as necessary.
|
2019-08-10 11:27:56 -04:00
|
|
|
class URL {
|
2021-05-25 16:13:15 -04:00
|
|
|
friend class URLParser;
|
|
|
|
|
2019-08-10 11:27:56 -04:00
|
|
|
public:
|
2021-05-25 07:50:03 -04:00
|
|
|
enum class PercentEncodeSet {
|
|
|
|
C0Control,
|
|
|
|
Fragment,
|
|
|
|
Query,
|
|
|
|
SpecialQuery,
|
|
|
|
Path,
|
|
|
|
Userinfo,
|
|
|
|
Component,
|
|
|
|
ApplicationXWWWFormUrlencoded,
|
|
|
|
EncodeURI
|
|
|
|
};
|
|
|
|
|
2021-05-25 16:32:39 -04:00
|
|
|
enum class ExcludeFragment {
|
|
|
|
No,
|
|
|
|
Yes
|
|
|
|
};
|
|
|
|
|
2021-01-10 18:29:28 -05:00
|
|
|
URL() = default;
|
2021-11-10 18:55:02 -05:00
|
|
|
URL(StringView);
|
2021-06-01 04:58:27 -04:00
|
|
|
URL(String const& string)
|
2019-08-10 13:31:37 -04:00
|
|
|
: URL(string.view())
|
|
|
|
{
|
|
|
|
}
|
2019-08-10 11:27:56 -04:00
|
|
|
|
2021-09-13 15:42:48 -04:00
|
|
|
bool is_valid() const { return m_valid; }
|
2021-05-23 17:31:16 -04:00
|
|
|
|
2021-06-01 04:58:27 -04:00
|
|
|
String const& scheme() const { return m_scheme; }
|
|
|
|
String const& username() const { return m_username; }
|
|
|
|
String const& password() const { return m_password; }
|
|
|
|
String const& host() const { return m_host; }
|
|
|
|
Vector<String> const& paths() const { return m_paths; }
|
|
|
|
String const& query() const { return m_query; }
|
|
|
|
String const& fragment() const { return m_fragment; }
|
2021-09-13 16:12:16 -04:00
|
|
|
Optional<u16> port() const { return m_port; }
|
|
|
|
u16 port_or_default() const { return m_port.value_or(default_port_for_scheme(m_scheme)); }
|
2021-09-13 15:42:48 -04:00
|
|
|
bool cannot_be_a_base_url() const { return m_cannot_be_a_base_url; }
|
2021-09-13 15:46:31 -04:00
|
|
|
bool cannot_have_a_username_or_password_or_port() const { return m_host.is_null() || m_host.is_empty() || m_cannot_be_a_base_url || m_scheme == "file"sv; }
|
2019-08-10 11:27:56 -04:00
|
|
|
|
2021-05-25 16:05:01 -04:00
|
|
|
bool includes_credentials() const { return !m_username.is_empty() || !m_password.is_empty(); }
|
|
|
|
bool is_special() const { return is_special_scheme(m_scheme); }
|
|
|
|
|
2021-06-01 04:58:27 -04:00
|
|
|
void set_scheme(String);
|
|
|
|
void set_username(String);
|
|
|
|
void set_password(String);
|
|
|
|
void set_host(String);
|
2021-09-13 16:12:16 -04:00
|
|
|
void set_port(Optional<u16>);
|
2021-06-01 04:58:27 -04:00
|
|
|
void set_paths(Vector<String>);
|
|
|
|
void set_query(String);
|
|
|
|
void set_fragment(String);
|
|
|
|
void set_cannot_be_a_base_url(bool value) { m_cannot_be_a_base_url = value; }
|
2021-09-13 16:20:38 -04:00
|
|
|
void append_path(String path) { m_paths.append(move(path)); }
|
2019-10-05 04:14:42 -04:00
|
|
|
|
2021-05-25 15:32:20 -04:00
|
|
|
String path() const;
|
2020-05-05 17:56:35 -04:00
|
|
|
String basename() const;
|
2019-08-10 11:27:56 -04:00
|
|
|
|
2021-05-25 16:32:39 -04:00
|
|
|
String serialize(ExcludeFragment = ExcludeFragment::No) const;
|
|
|
|
String serialize_for_display() const;
|
2021-05-27 15:38:16 -04:00
|
|
|
String to_string() const { return serialize(); }
|
|
|
|
|
2021-09-13 15:18:14 -04:00
|
|
|
// HTML origin
|
|
|
|
String serialize_origin() const;
|
|
|
|
|
2021-06-01 04:58:27 -04:00
|
|
|
bool equals(URL const& other, ExcludeFragment = ExcludeFragment::No) const;
|
2021-05-27 15:38:16 -04:00
|
|
|
|
2021-06-01 04:58:27 -04:00
|
|
|
URL complete_url(String const&) const;
|
2019-11-18 16:04:39 -05:00
|
|
|
|
2020-04-26 16:48:54 -04:00
|
|
|
bool data_payload_is_base64() const { return m_data_payload_is_base64; }
|
2021-06-01 04:58:27 -04:00
|
|
|
String const& data_mime_type() const { return m_data_mime_type; }
|
|
|
|
String const& data_payload() const { return m_data_payload; }
|
2020-04-26 16:48:54 -04:00
|
|
|
|
2021-06-01 04:58:27 -04:00
|
|
|
static URL create_with_url_or_path(String const&);
|
|
|
|
static URL create_with_file_scheme(String const& path, String const& fragment = {}, String const& hostname = {});
|
2022-03-23 22:46:52 -04:00
|
|
|
static URL create_with_help_scheme(String const& path, String const& fragment = {}, String const& hostname = {});
|
2021-06-01 04:58:27 -04:00
|
|
|
static URL create_with_data(String mime_type, String payload, bool is_base64 = false) { return URL(move(mime_type), move(payload), is_base64); };
|
2021-05-25 16:05:01 -04:00
|
|
|
|
2021-11-10 18:55:02 -05:00
|
|
|
static bool scheme_requires_port(StringView);
|
|
|
|
static u16 default_port_for_scheme(StringView);
|
|
|
|
static bool is_special_scheme(StringView);
|
2020-04-18 16:02:04 -04:00
|
|
|
|
2022-04-09 12:34:49 -04:00
|
|
|
enum class SpaceAsPlus {
|
|
|
|
No,
|
|
|
|
Yes,
|
|
|
|
};
|
|
|
|
static String percent_encode(StringView input, PercentEncodeSet set = PercentEncodeSet::Userinfo, SpaceAsPlus = SpaceAsPlus::No);
|
2021-11-10 18:55:02 -05:00
|
|
|
static String percent_decode(StringView input);
|
2021-05-25 07:50:03 -04:00
|
|
|
|
2021-06-01 05:14:30 -04:00
|
|
|
bool operator==(URL const& other) const { return equals(other, ExcludeFragment::No); }
|
2020-06-01 15:50:07 -04:00
|
|
|
|
2022-04-09 18:48:15 -04:00
|
|
|
static bool code_point_is_in_percent_encode_set(u32 code_point, URL::PercentEncodeSet);
|
|
|
|
|
2019-08-10 11:27:56 -04:00
|
|
|
private:
|
2021-05-25 16:05:01 -04:00
|
|
|
URL(String&& data_mime_type, String&& data_payload, bool payload_is_base64)
|
|
|
|
: m_valid(true)
|
|
|
|
, m_scheme("data")
|
|
|
|
, m_data_payload_is_base64(payload_is_base64)
|
|
|
|
, m_data_mime_type(move(data_mime_type))
|
|
|
|
, m_data_payload(move(data_payload))
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-04-11 17:07:23 -04:00
|
|
|
bool compute_validity() const;
|
2021-05-25 16:32:39 -04:00
|
|
|
String serialize_data_url() const;
|
2019-08-10 11:27:56 -04:00
|
|
|
|
2022-04-08 09:20:30 -04:00
|
|
|
static void append_percent_encoded_if_necessary(StringBuilder&, u32 code_point, PercentEncodeSet set = PercentEncodeSet::Userinfo);
|
2021-05-25 07:50:03 -04:00
|
|
|
static void append_percent_encoded(StringBuilder&, u32 code_point);
|
|
|
|
|
2019-08-10 11:27:56 -04:00
|
|
|
bool m_valid { false };
|
2021-05-25 15:32:20 -04:00
|
|
|
|
2021-05-23 17:31:16 -04:00
|
|
|
String m_scheme;
|
2021-05-25 15:32:20 -04:00
|
|
|
String m_username;
|
|
|
|
String m_password;
|
2019-08-10 11:27:56 -04:00
|
|
|
String m_host;
|
2021-09-13 16:12:16 -04:00
|
|
|
// NOTE: If the port is the default port for the scheme, m_port should be empty.
|
|
|
|
Optional<u16> m_port;
|
2019-08-10 11:27:56 -04:00
|
|
|
String m_path;
|
2021-05-25 15:32:20 -04:00
|
|
|
Vector<String> m_paths;
|
2019-11-25 15:20:03 -05:00
|
|
|
String m_query;
|
2020-04-11 18:38:13 -04:00
|
|
|
String m_fragment;
|
2021-05-25 15:32:20 -04:00
|
|
|
|
|
|
|
bool m_cannot_be_a_base_url { false };
|
|
|
|
|
|
|
|
bool m_data_payload_is_base64 { false };
|
2020-04-26 16:48:54 -04:00
|
|
|
String m_data_mime_type;
|
|
|
|
String m_data_payload;
|
2019-08-10 11:27:56 -04:00
|
|
|
};
|
|
|
|
|
2020-10-04 07:29:47 -04:00
|
|
|
template<>
|
|
|
|
struct Formatter<URL> : Formatter<StringView> {
|
2021-11-15 19:15:21 -05:00
|
|
|
ErrorOr<void> format(FormatBuilder& builder, URL const& value)
|
2020-10-04 07:29:47 -04:00
|
|
|
{
|
2021-11-15 19:15:21 -05:00
|
|
|
return Formatter<StringView>::format(builder, value.serialize());
|
2020-10-04 07:29:47 -04:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2020-06-01 15:50:07 -04:00
|
|
|
template<>
|
|
|
|
struct Traits<URL> : public GenericTraits<URL> {
|
2021-06-01 04:58:27 -04:00
|
|
|
static unsigned hash(URL const& url) { return url.to_string().hash(); }
|
2020-06-01 15:50:07 -04:00
|
|
|
};
|
|
|
|
|
2020-05-16 13:35:39 -04:00
|
|
|
}
|