2020-01-18 09:38:21 +01:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
|
|
|
|
*
|
2021-04-22 01:24:48 -07:00
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2020-01-18 09:38:21 +01:00
|
|
|
*/
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
#pragma once
|
|
|
|
|
2020-09-23 13:21:18 +02:00
|
|
|
#include <AK/Format.h>
|
2020-02-14 21:41:10 +01:00
|
|
|
#include <AK/Forward.h>
|
2019-06-21 18:45:35 +02:00
|
|
|
#include <AK/RefPtr.h>
|
2020-08-05 12:14:44 +02:00
|
|
|
#include <AK/Stream.h>
|
2021-01-15 20:13:14 +01:00
|
|
|
#include <AK/StringBuilder.h>
|
2019-04-15 14:56:37 +02:00
|
|
|
#include <AK/StringImpl.h>
|
2020-02-26 15:25:24 +08:00
|
|
|
#include <AK/StringUtils.h>
|
2019-04-15 14:56:37 +02:00
|
|
|
#include <AK/Traits.h>
|
2018-10-10 11:53:07 +02:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2019-06-02 08:37:01 +02:00
|
|
|
// String is a convenience wrapper around StringImpl, suitable for passing
|
|
|
|
// around as a value type. It's basically the same as passing around a
|
2019-06-21 18:37:47 +02:00
|
|
|
// RefPtr<StringImpl>, with a bit of syntactic sugar.
|
2019-06-02 08:37:01 +02:00
|
|
|
//
|
|
|
|
// Note that StringImpl is an immutable object that cannot shrink or grow.
|
|
|
|
// Its allocation size is snugly tailored to the specific string it contains.
|
|
|
|
// Copying a String is very efficient, since the internal StringImpl is
|
2019-06-21 18:40:24 +02:00
|
|
|
// ref-counted, so copying only requires modifying the ref count.
|
2019-06-02 08:37:01 +02:00
|
|
|
//
|
|
|
|
// There are three main ways to construct a new String:
|
|
|
|
//
|
|
|
|
// s = String("some literal");
|
|
|
|
//
|
2021-04-21 23:45:08 +02:00
|
|
|
// s = String::formatted("{} little piggies", m_piggies);
|
2019-06-02 08:37:01 +02:00
|
|
|
//
|
|
|
|
// StringBuilder builder;
|
|
|
|
// builder.append("abc");
|
|
|
|
// builder.append("123");
|
|
|
|
// s = builder.to_string();
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
class String {
|
|
|
|
public:
|
2021-01-10 16:29:28 -07:00
|
|
|
~String() = default;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2021-01-10 16:29:28 -07:00
|
|
|
String() = default;
|
2020-03-23 13:45:10 +01:00
|
|
|
String(const StringView&);
|
2019-04-15 14:56:37 +02:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
String(const String& other)
|
2019-07-11 15:45:11 +02:00
|
|
|
: m_impl(const_cast<String&>(other).m_impl)
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
String(String&& other)
|
2018-10-17 10:55:43 +02:00
|
|
|
: m_impl(move(other.m_impl))
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2018-11-07 00:19:35 +01:00
|
|
|
String(const char* cstring, ShouldChomp shouldChomp = NoChomp)
|
|
|
|
: m_impl(StringImpl::create(cstring, shouldChomp))
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2019-12-09 17:45:40 +01:00
|
|
|
String(const char* cstring, size_t length, ShouldChomp shouldChomp = NoChomp)
|
2018-11-07 00:19:35 +01:00
|
|
|
: m_impl(StringImpl::create(cstring, length, shouldChomp))
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-08-05 10:37:34 +02:00
|
|
|
explicit String(ReadonlyBytes bytes, ShouldChomp shouldChomp = NoChomp)
|
|
|
|
: m_impl(StringImpl::create(bytes, shouldChomp))
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
String(const StringImpl& impl)
|
|
|
|
: m_impl(const_cast<StringImpl&>(impl))
|
2019-04-12 14:43:44 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
String(const StringImpl* impl)
|
|
|
|
: m_impl(const_cast<StringImpl*>(impl))
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2019-06-21 18:37:47 +02:00
|
|
|
String(RefPtr<StringImpl>&& impl)
|
2018-10-17 10:55:43 +02:00
|
|
|
: m_impl(move(impl))
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2019-06-21 18:37:47 +02:00
|
|
|
String(NonnullRefPtr<StringImpl>&& impl)
|
2019-02-25 16:04:08 +01:00
|
|
|
: m_impl(move(impl))
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-03-22 19:07:02 +01:00
|
|
|
String(const FlyString&);
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String repeated(char, size_t count);
|
2021-01-15 20:13:14 +01:00
|
|
|
|
2021-04-30 23:31:53 +02:00
|
|
|
[[nodiscard]] static String bijective_base_from(size_t value, unsigned base = 26, StringView map = {});
|
|
|
|
|
2021-01-15 20:13:14 +01:00
|
|
|
template<class SeparatorType, class CollectionType>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String join(const SeparatorType& separator, const CollectionType& collection)
|
2021-01-15 20:13:14 +01:00
|
|
|
{
|
|
|
|
StringBuilder builder;
|
|
|
|
builder.join(separator, collection);
|
|
|
|
return builder.build();
|
|
|
|
}
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool matches(const StringView& mask, CaseSensitivity = CaseSensitivity::CaseInsensitive) const;
|
|
|
|
[[nodiscard]] bool matches(const StringView& mask, Vector<MaskSpan>&, CaseSensitivity = CaseSensitivity::CaseInsensitive) const;
|
2019-04-25 22:56:09 +02:00
|
|
|
|
2020-12-11 00:17:30 +11:00
|
|
|
template<typename T = int>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] Optional<T> to_int() const;
|
2020-12-11 00:17:30 +11:00
|
|
|
template<typename T = unsigned>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] Optional<T> to_uint() const;
|
2018-10-31 19:49:22 +01:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] String to_lowercase() const;
|
|
|
|
[[nodiscard]] String to_uppercase() const;
|
|
|
|
[[nodiscard]] String to_snakecase() const;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool is_whitespace() const { return StringUtils::is_whitespace(*this); }
|
2021-01-03 02:56:02 +03:30
|
|
|
|
2020-09-20 18:05:04 +04:30
|
|
|
#ifndef KERNEL
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] String trim_whitespace(TrimMode mode = TrimMode::Both) const
|
2020-09-20 18:05:04 +04:30
|
|
|
{
|
|
|
|
return StringUtils::trim_whitespace(StringView { characters(), length() }, mode);
|
|
|
|
}
|
|
|
|
#endif
|
2020-05-11 01:43:33 +01:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool equals_ignoring_case(const StringView&) const;
|
2019-12-18 12:43:53 +01:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool contains(const StringView&, CaseSensitivity = CaseSensitivity::CaseSensitive) const;
|
|
|
|
[[nodiscard]] Optional<size_t> index_of(const String&, size_t start = 0) const;
|
2019-10-28 18:47:48 +01:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] Vector<String> split_limit(char separator, size_t limit, bool keep_empty = false) const;
|
|
|
|
[[nodiscard]] Vector<String> split(char separator, bool keep_empty = false) const;
|
2021-01-12 23:28:45 +03:30
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] Optional<size_t> find(char) const;
|
|
|
|
[[nodiscard]] Optional<size_t> find(const StringView&) const;
|
2021-01-12 23:28:45 +03:30
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] String substring(size_t start) const;
|
|
|
|
[[nodiscard]] String substring(size_t start, size_t length) const;
|
2019-04-16 02:39:16 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] Vector<StringView> split_view(char separator, bool keep_empty = false) const;
|
|
|
|
[[nodiscard]] StringView substring_view(size_t start, size_t length) const;
|
|
|
|
[[nodiscard]] StringView substring_view(size_t start) const;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool is_null() const { return !m_impl; }
|
|
|
|
[[nodiscard]] ALWAYS_INLINE bool is_empty() const { return length() == 0; }
|
|
|
|
[[nodiscard]] ALWAYS_INLINE size_t length() const { return m_impl ? m_impl->length() : 0; }
|
2020-08-23 12:56:46 +02:00
|
|
|
// Includes NUL-terminator, if non-nullptr.
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] ALWAYS_INLINE const char* characters() const { return m_impl ? m_impl->characters() : nullptr; }
|
2020-07-27 14:15:37 +02:00
|
|
|
|
2020-08-25 17:23:18 +03:00
|
|
|
[[nodiscard]] bool copy_characters_to_buffer(char* buffer, size_t buffer_size) const;
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] ALWAYS_INLINE ReadonlyBytes bytes() const
|
2021-01-10 16:29:28 -07:00
|
|
|
{
|
|
|
|
if (m_impl) {
|
|
|
|
return m_impl->bytes();
|
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
2020-07-27 14:15:37 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] ALWAYS_INLINE const char& operator[](size_t i) const
|
2019-05-28 11:53:16 +02:00
|
|
|
{
|
|
|
|
return (*m_impl)[i];
|
|
|
|
}
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2020-09-06 21:14:08 +02:00
|
|
|
using ConstIterator = SimpleIterator<const String, const char>;
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] constexpr ConstIterator begin() const { return ConstIterator::begin(*this); }
|
|
|
|
[[nodiscard]] constexpr ConstIterator end() const { return ConstIterator::end(*this); }
|
2020-03-10 16:13:29 +08:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool starts_with(const StringView&, CaseSensitivity = CaseSensitivity::CaseSensitive) const;
|
|
|
|
[[nodiscard]] bool ends_with(const StringView&, CaseSensitivity = CaseSensitivity::CaseSensitive) const;
|
|
|
|
[[nodiscard]] bool starts_with(char) const;
|
|
|
|
[[nodiscard]] bool ends_with(char) const;
|
2019-03-22 12:43:29 +01:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
bool operator==(const String&) const;
|
|
|
|
bool operator!=(const String& other) const { return !(*this == other); }
|
2019-07-11 11:58:27 +01:00
|
|
|
|
2019-08-24 22:28:42 +02:00
|
|
|
bool operator==(const StringView&) const;
|
|
|
|
bool operator!=(const StringView& other) const { return !(*this == other); }
|
|
|
|
|
2020-03-28 09:11:00 +01:00
|
|
|
bool operator==(const FlyString&) const;
|
|
|
|
bool operator!=(const FlyString& other) const { return !(*this == other); }
|
|
|
|
|
2019-03-09 13:33:52 +01:00
|
|
|
bool operator<(const String&) const;
|
2019-07-04 14:20:48 +02:00
|
|
|
bool operator<(const char*) const;
|
|
|
|
bool operator>=(const String& other) const { return !(*this < other); }
|
|
|
|
bool operator>=(const char* other) const { return !(*this < other); }
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2019-07-11 11:58:27 +01:00
|
|
|
bool operator>(const String&) const;
|
|
|
|
bool operator>(const char*) const;
|
|
|
|
bool operator<=(const String& other) const { return !(*this > other); }
|
|
|
|
bool operator<=(const char* other) const { return !(*this > other); }
|
|
|
|
|
2020-03-23 13:45:10 +01:00
|
|
|
bool operator==(const char* cstring) const;
|
|
|
|
bool operator!=(const char* cstring) const { return !(*this == cstring); }
|
2019-06-08 18:30:40 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] String isolated_copy() const;
|
2018-10-26 09:54:29 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String empty();
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] StringImpl* impl() { return m_impl.ptr(); }
|
|
|
|
[[nodiscard]] const StringImpl* impl() const { return m_impl.ptr(); }
|
2018-10-10 11:53:07 +02:00
|
|
|
|
|
|
|
String& operator=(String&& other)
|
|
|
|
{
|
2018-10-24 14:28:22 +02:00
|
|
|
if (this != &other)
|
2018-10-17 10:55:43 +02:00
|
|
|
m_impl = move(other.m_impl);
|
2018-10-24 14:28:22 +02:00
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String& operator=(const String& other)
|
|
|
|
{
|
|
|
|
if (this != &other)
|
2019-07-11 15:45:11 +02:00
|
|
|
m_impl = const_cast<String&>(other).m_impl;
|
2018-10-10 11:53:07 +02:00
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2020-08-05 10:37:34 +02:00
|
|
|
String& operator=(std::nullptr_t)
|
|
|
|
{
|
|
|
|
m_impl = nullptr;
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String& operator=(ReadonlyBytes bytes)
|
|
|
|
{
|
|
|
|
m_impl = StringImpl::create(bytes);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] u32 hash() const
|
2019-10-18 17:17:47 +02:00
|
|
|
{
|
|
|
|
if (!m_impl)
|
|
|
|
return 0;
|
|
|
|
return m_impl->hash();
|
|
|
|
}
|
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] ByteBuffer to_byte_buffer() const;
|
2019-04-20 14:13:40 +02:00
|
|
|
|
|
|
|
template<typename BufferType>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String copy(const BufferType& buffer, ShouldChomp should_chomp = NoChomp)
|
2019-04-20 14:13:40 +02:00
|
|
|
{
|
|
|
|
if (buffer.is_null())
|
2019-05-28 11:53:16 +02:00
|
|
|
return {};
|
2019-04-20 14:13:40 +02:00
|
|
|
if (buffer.is_empty())
|
|
|
|
return empty();
|
|
|
|
return String((const char*)buffer.data(), buffer.size(), should_chomp);
|
|
|
|
}
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String vformatted(StringView fmtstr, TypeErasedFormatParams);
|
2020-09-23 13:21:18 +02:00
|
|
|
|
|
|
|
template<typename... Parameters>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String formatted(CheckedFormatString<Parameters...>&& fmtstr, const Parameters&... parameters)
|
2020-09-23 13:21:18 +02:00
|
|
|
{
|
2021-02-23 09:58:15 +03:30
|
|
|
return vformatted(fmtstr.view(), VariadicFormatParams { parameters... });
|
2020-09-23 13:21:18 +02:00
|
|
|
}
|
|
|
|
|
2020-12-30 04:59:14 -07:00
|
|
|
template<typename T>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] static String number(T value) requires IsArithmetic<T>
|
2021-01-17 11:52:04 +03:30
|
|
|
{
|
|
|
|
return formatted("{}", value);
|
|
|
|
}
|
2019-01-30 16:28:51 +01:00
|
|
|
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] StringView view() const;
|
2019-04-15 14:56:37 +02:00
|
|
|
|
2020-10-02 22:14:37 +01:00
|
|
|
int replace(const String& needle, const String& replacement, bool all_occurrences = false);
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] String reverse() const;
|
2020-04-01 21:27:39 +02:00
|
|
|
|
2020-05-25 12:36:41 +02:00
|
|
|
template<typename T, typename... Rest>
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool is_one_of(const T& string, Rest... rest) const
|
2020-05-25 12:36:41 +02:00
|
|
|
{
|
2020-07-28 17:40:23 +02:00
|
|
|
if (*this == string)
|
2020-05-25 12:36:41 +02:00
|
|
|
return true;
|
|
|
|
return is_one_of(rest...);
|
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
private:
|
2021-04-21 21:35:08 +02:00
|
|
|
[[nodiscard]] bool is_one_of() const { return false; }
|
2020-05-29 21:44:06 +02:00
|
|
|
|
2019-06-21 18:37:47 +02:00
|
|
|
RefPtr<StringImpl> m_impl;
|
2018-10-10 11:53:07 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
template<>
|
2019-06-29 19:14:03 +02:00
|
|
|
struct Traits<String> : public GenericTraits<String> {
|
2018-10-10 11:53:07 +02:00
|
|
|
static unsigned hash(const String& s) { return s.impl() ? s.impl()->hash() : 0; }
|
|
|
|
};
|
|
|
|
|
2021-02-25 21:10:47 +01:00
|
|
|
// Traits that treat Strings differing only in case as the same key. Both
// operations work on lowercased copies of their arguments.
struct CaseInsensitiveStringTraits : public Traits<String> {
    // A null String hashes to 0; otherwise the lowercased copy is hashed.
    static unsigned hash(const String& s)
    {
        if (!s.impl())
            return 0;
        auto lowered = s.to_lowercase();
        return lowered.impl()->hash();
    }

    // Two Strings are equal when their lowercased copies compare equal.
    static bool equals(const String& a, const String& b)
    {
        auto lowered_a = a.to_lowercase();
        auto lowered_b = b.to_lowercase();
        return lowered_a == lowered_b;
    }
};
|
|
|
|
|
2020-03-23 13:45:10 +01:00
|
|
|
bool operator<(const char*, const String&);
|
|
|
|
bool operator>=(const char*, const String&);
|
|
|
|
bool operator>(const char*, const String&);
|
|
|
|
bool operator<=(const char*, const String&);
|
2019-07-11 11:58:27 +01:00
|
|
|
|
2020-02-13 08:46:00 +01:00
|
|
|
String escape_html_entities(const StringView& html);
|
|
|
|
|
2020-09-23 13:21:18 +02:00
|
|
|
InputStream& operator>>(InputStream& stream, String& string);
|
2020-08-05 12:14:44 +02:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
|
2019-09-13 14:37:25 +02:00
|
|
|
using AK::CaseInsensitiveStringTraits;
|
2020-02-13 08:46:00 +01:00
|
|
|
using AK::escape_html_entities;
|
2020-03-10 16:13:29 +08:00
|
|
|
using AK::String;
|