2020-01-18 03:38:21 -05:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
|
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions are met:
|
|
|
|
*
|
|
|
|
* 1. Redistributions of source code must retain the above copyright notice, this
|
|
|
|
* list of conditions and the following disclaimer.
|
|
|
|
*
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
* this list of conditions and the following disclaimer in the documentation
|
|
|
|
* and/or other materials provided with the distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
|
|
* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
|
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
|
|
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
|
|
|
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
|
|
|
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
2019-04-15 08:56:37 -04:00
|
|
|
#pragma once
|
|
|
|
|
2020-04-29 17:17:54 -04:00
|
|
|
#include <AK/Assertions.h>
|
|
|
|
#include <AK/Checked.h>
|
2020-02-14 15:41:10 -05:00
|
|
|
#include <AK/Forward.h>
|
2020-07-27 08:15:37 -04:00
|
|
|
#include <AK/Span.h>
|
2020-02-14 15:41:10 -05:00
|
|
|
#include <AK/StdLibExtras.h>
|
2020-02-26 02:25:24 -05:00
|
|
|
#include <AK/StringUtils.h>
|
2019-04-15 20:39:16 -04:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2019-04-15 08:56:37 -04:00
|
|
|
class StringView {
|
|
|
|
public:
|
2020-03-10 04:13:29 -04:00
|
|
|
using ConstIterator = const char*;
|
|
|
|
|
2020-05-30 10:06:30 -04:00
|
|
|
ALWAYS_INLINE constexpr StringView() { }
|
|
|
|
ALWAYS_INLINE constexpr StringView(const char* characters, size_t length)
|
2019-05-28 05:53:16 -04:00
|
|
|
: m_characters(characters)
|
|
|
|
, m_length(length)
|
|
|
|
{
|
2020-04-29 17:17:54 -04:00
|
|
|
ASSERT(!Checked<uintptr_t>::addition_would_overflow((uintptr_t)characters, length));
|
2019-05-28 05:53:16 -04:00
|
|
|
}
|
2020-04-30 05:43:25 -04:00
|
|
|
ALWAYS_INLINE StringView(const unsigned char* characters, size_t length)
|
2019-05-28 05:53:16 -04:00
|
|
|
: m_characters((const char*)characters)
|
|
|
|
, m_length(length)
|
|
|
|
{
|
2020-04-29 17:17:54 -04:00
|
|
|
ASSERT(!Checked<uintptr_t>::addition_would_overflow((uintptr_t)characters, length));
|
2019-05-28 05:53:16 -04:00
|
|
|
}
|
2020-05-30 10:06:30 -04:00
|
|
|
ALWAYS_INLINE constexpr StringView(const char* cstring)
|
2019-04-15 08:56:37 -04:00
|
|
|
: m_characters(cstring)
|
2020-03-08 07:34:33 -04:00
|
|
|
, m_length(cstring ? __builtin_strlen(cstring) : 0)
|
2019-04-15 08:56:37 -04:00
|
|
|
{
|
|
|
|
}
|
2020-08-19 05:43:41 -04:00
|
|
|
ALWAYS_INLINE StringView(ReadonlyBytes bytes)
|
|
|
|
: m_characters(reinterpret_cast<const char*>(bytes.data()))
|
|
|
|
, m_length(bytes.size())
|
|
|
|
{
|
|
|
|
}
|
2019-06-29 06:03:28 -04:00
|
|
|
|
|
|
|
StringView(const ByteBuffer&);
|
|
|
|
StringView(const String&);
|
2020-03-22 05:12:55 -04:00
|
|
|
StringView(const FlyString&);
|
2019-04-15 08:56:37 -04:00
|
|
|
|
2019-06-08 12:30:40 -04:00
|
|
|
bool is_null() const { return !m_characters; }
|
2019-04-15 08:56:37 -04:00
|
|
|
bool is_empty() const { return m_length == 0; }
|
2020-07-27 08:15:37 -04:00
|
|
|
|
2019-07-08 09:38:44 -04:00
|
|
|
const char* characters_without_null_termination() const { return m_characters; }
|
2019-12-09 11:45:40 -05:00
|
|
|
size_t length() const { return m_length; }
|
2020-07-27 08:15:37 -04:00
|
|
|
|
|
|
|
ReadonlyBytes bytes() const { return { m_characters, m_length }; }
|
|
|
|
|
2020-03-10 04:13:29 -04:00
|
|
|
const char& operator[](size_t index) const { return m_characters[index]; }
|
|
|
|
|
|
|
|
ConstIterator begin() const { return characters_without_null_termination(); }
|
|
|
|
ConstIterator end() const { return begin() + length(); }
|
2019-04-15 08:56:37 -04:00
|
|
|
|
2019-08-24 16:31:06 -04:00
|
|
|
unsigned hash() const;
|
|
|
|
|
2020-07-18 12:59:38 -04:00
|
|
|
bool starts_with(const StringView&, CaseSensitivity = CaseSensitivity::CaseSensitive) const;
|
2020-05-26 06:21:34 -04:00
|
|
|
bool ends_with(const StringView&, CaseSensitivity = CaseSensitivity::CaseSensitive) const;
|
2020-02-14 16:14:22 -05:00
|
|
|
bool starts_with(char) const;
|
|
|
|
bool ends_with(char) const;
|
2020-02-26 02:25:24 -05:00
|
|
|
bool matches(const StringView& mask, CaseSensitivity = CaseSensitivity::CaseInsensitive) const;
|
2020-04-17 09:04:40 -04:00
|
|
|
bool contains(char) const;
|
2020-07-04 14:04:00 -04:00
|
|
|
bool contains(const StringView&) const;
|
2020-05-13 12:59:31 -04:00
|
|
|
bool equals_ignoring_case(const StringView& other) const;
|
2019-09-12 07:13:07 -04:00
|
|
|
|
2020-05-02 14:21:20 -04:00
|
|
|
Optional<size_t> find_first_of(char) const;
|
|
|
|
Optional<size_t> find_first_of(const StringView&) const;
|
|
|
|
|
|
|
|
Optional<size_t> find_last_of(char) const;
|
|
|
|
Optional<size_t> find_last_of(const StringView&) const;
|
|
|
|
|
2019-12-09 11:45:40 -05:00
|
|
|
StringView substring_view(size_t start, size_t length) const;
|
2019-09-20 17:43:37 -04:00
|
|
|
Vector<StringView> split_view(char, bool keep_empty = false) const;
|
2020-05-27 16:21:43 -04:00
|
|
|
Vector<StringView> split_view(const StringView&, bool keep_empty = false) const;
|
2019-08-04 05:44:20 -04:00
|
|
|
|
2019-12-02 07:42:33 -05:00
|
|
|
// Create a Vector of StringViews split by line endings. As of CommonMark
|
|
|
|
// 0.29, the spec defines a line ending as "a newline (U+000A), a carriage
|
|
|
|
// return (U+000D) not followed by a newline, or a carriage return and a
|
|
|
|
// following newline.".
|
|
|
|
Vector<StringView> lines(bool consider_cr = true) const;
|
|
|
|
|
2020-06-12 15:07:52 -04:00
|
|
|
Optional<int> to_int() const;
|
|
|
|
Optional<unsigned> to_uint() const;
|
2019-04-15 20:39:16 -04:00
|
|
|
|
2019-06-13 09:30:55 -04:00
|
|
|
// Create a new substring view of this string view, starting either at the beginning of
|
|
|
|
// the given substring view, or after its end, and continuing until the end of this string
|
|
|
|
// view (that is, for the remaining part of its length). For example,
|
|
|
|
//
|
|
|
|
// StringView str { "foobar" };
|
|
|
|
// StringView substr = str.substring_view(1, 2); // "oo"
|
|
|
|
// StringView substr_from = str.substring_view_starting_from_substring(subst); // "oobar"
|
|
|
|
// StringView substr_after = str.substring_view_starting_after_substring(subst); // "bar"
|
|
|
|
//
|
|
|
|
// Note that this only works if the string view passed as an argument is indeed a substring
|
|
|
|
// view of this string view, such as one created by substring_view() and split_view(). It
|
|
|
|
// does not work for arbitrary strings; for example declaring substr in the example above as
|
|
|
|
//
|
|
|
|
// StringView substr { "oo" };
|
|
|
|
//
|
|
|
|
// would not work.
|
|
|
|
StringView substring_view_starting_from_substring(const StringView& substring) const;
|
|
|
|
StringView substring_view_starting_after_substring(const StringView& substring) const;
|
|
|
|
|
2019-06-07 13:22:58 -04:00
|
|
|
bool operator==(const char* cstring) const
|
|
|
|
{
|
2019-06-08 12:30:40 -04:00
|
|
|
if (is_null())
|
|
|
|
return !cstring;
|
|
|
|
if (!cstring)
|
|
|
|
return false;
|
2020-03-08 07:34:33 -04:00
|
|
|
size_t other_length = __builtin_strlen(cstring);
|
2019-06-07 13:22:58 -04:00
|
|
|
if (m_length != other_length)
|
|
|
|
return false;
|
2020-03-08 07:34:33 -04:00
|
|
|
return !__builtin_memcmp(m_characters, cstring, m_length);
|
2019-06-07 13:22:58 -04:00
|
|
|
}
|
|
|
|
bool operator!=(const char* cstring) const
|
|
|
|
{
|
|
|
|
return !(*this == cstring);
|
|
|
|
}
|
2019-04-15 20:39:16 -04:00
|
|
|
|
|
|
|
bool operator==(const String&) const;
|
|
|
|
|
2019-08-15 08:07:23 -04:00
|
|
|
bool operator==(const StringView& other) const
|
|
|
|
{
|
|
|
|
if (is_null())
|
|
|
|
return other.is_null();
|
|
|
|
if (other.is_null())
|
|
|
|
return false;
|
|
|
|
if (length() != other.length())
|
|
|
|
return false;
|
2020-03-08 07:34:33 -04:00
|
|
|
return !__builtin_memcmp(m_characters, other.m_characters, m_length);
|
2019-08-15 08:07:23 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
bool operator!=(const StringView& other) const
|
|
|
|
{
|
|
|
|
return !(*this == other);
|
|
|
|
}
|
|
|
|
|
2020-08-09 21:55:32 -04:00
|
|
|
bool operator<(const StringView& other) const
|
|
|
|
{
|
|
|
|
if (int c = __builtin_memcmp(m_characters, other.m_characters, min(m_length, other.m_length)))
|
|
|
|
return c < 0;
|
|
|
|
return m_length < other.m_length;
|
|
|
|
}
|
|
|
|
|
2020-03-22 08:07:45 -04:00
|
|
|
const StringImpl* impl() const { return m_impl; }
|
|
|
|
|
2020-05-06 12:53:05 -04:00
|
|
|
String to_string() const;
|
|
|
|
|
2020-06-07 14:53:30 -04:00
|
|
|
const char* begin() { return m_characters; }
|
|
|
|
const char* end() { return m_characters + m_length; }
|
|
|
|
|
2019-04-15 08:56:37 -04:00
|
|
|
private:
|
2019-06-03 12:27:56 -04:00
|
|
|
friend class String;
|
2019-06-08 17:55:13 -04:00
|
|
|
const StringImpl* m_impl { nullptr };
|
2019-04-15 08:56:37 -04:00
|
|
|
const char* m_characters { nullptr };
|
2019-12-09 11:45:40 -05:00
|
|
|
size_t m_length { 0 };
|
2019-04-15 08:56:37 -04:00
|
|
|
};
|
2019-04-15 20:39:16 -04:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
using AK::StringView;
|