2020-01-18 09:38:21 +01:00
|
|
|
/*
 * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
|
2019-09-06 15:34:26 +02:00
|
|
|
#include <AK/StdLibExtras.h>
|
|
|
|
#include <AK/String.h>
|
|
|
|
#include <AK/StringBuilder.h>
|
2020-02-14 21:41:10 +01:00
|
|
|
#include <AK/Vector.h>
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2019-12-30 14:52:04 +01:00
|
|
|
#ifndef KERNEL
|
2020-02-14 21:41:10 +01:00
|
|
|
# include <inttypes.h>
|
2019-12-30 14:52:04 +01:00
|
|
|
#endif
|
|
|
|
|
2019-10-28 18:47:48 +01:00
|
|
|
#ifdef KERNEL
|
|
|
|
extern "C" char* strstr(const char* haystack, const char* needle);
|
|
|
|
#endif
|
|
|
|
|
2019-12-18 12:43:53 +01:00
|
|
|
// Maps the ASCII letters 'A'..'Z' to 'a'..'z'; any other character is
// returned unchanged.
static inline char to_lowercase(char c)
{
    const bool is_ascii_upper = 'A' <= c && c <= 'Z';
    // Setting bit 0x20 turns an upper-case ASCII letter into its lower-case form.
    return is_ascii_upper ? (c | 0x20) : c;
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
namespace AK {
|
|
|
|
|
|
|
|
bool String::operator==(const String& other) const
|
|
|
|
{
|
|
|
|
if (!m_impl)
|
|
|
|
return !other.m_impl;
|
|
|
|
|
|
|
|
if (!other.m_impl)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (length() != other.length())
|
|
|
|
return false;
|
2019-05-26 03:08:36 +01:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
return !memcmp(characters(), other.characters(), length());
|
|
|
|
}
|
|
|
|
|
2019-08-24 22:28:42 +02:00
|
|
|
bool String::operator==(const StringView& other) const
|
|
|
|
{
|
|
|
|
if (!m_impl)
|
|
|
|
return !other.m_characters;
|
|
|
|
|
|
|
|
if (!other.m_characters)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (length() != other.length())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return !memcmp(characters(), other.characters_without_null_termination(), length());
|
|
|
|
}
|
|
|
|
|
2019-03-09 13:33:52 +01:00
|
|
|
bool String::operator<(const String& other) const
|
|
|
|
{
|
|
|
|
if (!m_impl)
|
|
|
|
return other.m_impl;
|
|
|
|
|
|
|
|
if (!other.m_impl)
|
|
|
|
return false;
|
|
|
|
|
2019-03-09 14:24:34 +01:00
|
|
|
return strcmp(characters(), other.characters()) < 0;
|
2019-03-09 13:33:52 +01:00
|
|
|
}
|
|
|
|
|
2019-10-19 20:50:55 +02:00
|
|
|
bool String::operator>(const String& other) const
|
|
|
|
{
|
|
|
|
if (!m_impl)
|
|
|
|
return other.m_impl;
|
|
|
|
|
|
|
|
if (!other.m_impl)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return strcmp(characters(), other.characters()) > 0;
|
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
// Returns a String built from StringImpl::the_empty_stringimpl().
String String::empty()
{
    return StringImpl::the_empty_stringimpl();
}
|
|
|
|
|
2018-12-21 02:10:45 +01:00
|
|
|
// Produces a copy of this string whose characters live in a newly created
// StringImpl rather than in this string's impl.
// A null string yields a null string; a zero-length string yields empty().
String String::isolated_copy() const
{
    if (!m_impl)
        return {};

    if (m_impl->length() == 0)
        return empty();

    // create_uninitialized() hands back the new impl and points `storage` at
    // its character buffer, which is then filled from our own characters.
    char* storage;
    auto fresh_impl = StringImpl::create_uninitialized(length(), storage);
    memcpy(storage, m_impl->characters(), m_impl->length());
    return String(move(*fresh_impl));
}
|
|
|
|
|
2019-12-09 17:45:40 +01:00
|
|
|
// Returns a new String holding `length` characters starting at offset `start`.
// A zero `length` returns a default-constructed String without touching the
// impl. Otherwise the range [start, start + length) must lie inside this
// string; this is enforced with ASSERT only.
String String::substring(size_t start, size_t length) const
{
    if (!length)
        return {};
    ASSERT(m_impl);
    // Check the range without computing `start + length`, which can wrap
    // around size_t and let an out-of-range request slip past the assertion.
    ASSERT(start <= m_impl->length());
    ASSERT(length <= m_impl->length() - start);
    return { characters() + start, length };
}
|
|
|
|
|
2019-12-09 17:45:40 +01:00
|
|
|
// Returns a StringView over `length` characters of this string starting at
// offset `start`. The view points into this string's own character data.
// The range [start, start + length) must lie inside this string; this is
// enforced with ASSERT only.
StringView String::substring_view(size_t start, size_t length) const
{
    ASSERT(m_impl);
    // Check the range without computing `start + length`, which can wrap
    // around size_t and let an out-of-range request slip past the assertion.
    ASSERT(start <= m_impl->length());
    ASSERT(length <= m_impl->length() - start);
    return { characters() + start, length };
}
|
|
|
|
|
2020-01-22 17:17:27 +03:00
|
|
|
// Splits on `separator` by forwarding to split_limit() with a limit of 0.
Vector<String> String::split(char separator, bool keep_empty) const
{
    const size_t limit = 0;
    return split_limit(separator, limit, keep_empty);
}
|
|
|
|
|
2020-01-22 17:17:27 +03:00
|
|
|
// Splits this string on `separator` into at most `limit` pieces.
// Scanning stops once the result holds `limit - 1` pieces, and everything
// after the last consumed separator becomes the final piece. With a limit of
// 0 the stop condition never triggers, so the whole string is scanned.
// Zero-length pieces are only emitted when `keep_empty` is true.
// An empty string yields an empty vector.
Vector<String> String::split_limit(char separator, size_t limit, bool keep_empty) const
{
    Vector<String> parts;
    if (is_empty())
        return parts;

    size_t piece_begin = 0;
    size_t index = 0;
    while (index < length() && (parts.size() + 1) != limit) {
        if (characters()[index] == separator) {
            size_t piece_length = index - piece_begin;
            if (keep_empty || piece_length != 0)
                parts.append(substring(piece_begin, piece_length));
            // The next piece starts right after the separator.
            piece_begin = index + 1;
        }
        ++index;
    }

    // Whatever follows the last consumed separator is the trailing piece.
    size_t tail_length = length() - piece_begin;
    if (keep_empty || tail_length != 0)
        parts.append(substring(piece_begin, tail_length));
    return parts;
}
|
|
|
|
|
2019-09-21 00:43:37 +03:00
|
|
|
// Splits this string on `separator`, returning views produced by
// substring_view() instead of new Strings.
// Zero-length pieces are only emitted when `keep_empty` is true.
// An empty string yields an empty vector.
Vector<StringView> String::split_view(const char separator, bool keep_empty) const
{
    Vector<StringView> parts;
    if (is_empty())
        return parts;

    size_t piece_begin = 0;
    size_t index = 0;
    while (index < length()) {
        if (characters()[index] == separator) {
            size_t piece_length = index - piece_begin;
            if (keep_empty || piece_length != 0)
                parts.append(substring_view(piece_begin, piece_length));
            // The next piece starts right after the separator.
            piece_begin = index + 1;
        }
        ++index;
    }

    // Whatever follows the last separator is the trailing piece.
    size_t tail_length = length() - piece_begin;
    if (keep_empty || tail_length != 0)
        parts.append(substring_view(piece_begin, tail_length));
    return parts;
}
|
|
|
|
|
2018-12-21 02:10:45 +01:00
|
|
|
// Copies this string's characters into a ByteBuffer via ByteBuffer::copy().
// A null string yields a ByteBuffer constructed from nullptr.
ByteBuffer String::to_byte_buffer() const
{
    if (!m_impl)
        return nullptr;

    const u8* bytes = reinterpret_cast<const u8*>(characters());
    return ByteBuffer::copy(bytes, length());
}
|
|
|
|
|
2019-04-19 01:05:59 +02:00
|
|
|
int String::to_int(bool& ok) const
|
|
|
|
{
|
2019-05-26 03:08:36 +01:00
|
|
|
bool negative = false;
|
|
|
|
int value = 0;
|
2019-12-09 17:45:40 +01:00
|
|
|
size_t i = 0;
|
2019-05-26 03:08:36 +01:00
|
|
|
|
2019-07-08 10:51:45 +02:00
|
|
|
if (is_empty()) {
|
2019-05-26 03:08:36 +01:00
|
|
|
ok = false;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (characters()[0] == '-') {
|
|
|
|
i++;
|
|
|
|
negative = true;
|
|
|
|
}
|
|
|
|
for (; i < length(); i++) {
|
|
|
|
if (characters()[i] < '0' || characters()[i] > '9') {
|
|
|
|
ok = false;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
value = value * 10;
|
|
|
|
value += characters()[i] - '0';
|
|
|
|
}
|
|
|
|
ok = true;
|
|
|
|
|
|
|
|
return negative ? -value : value;
|
2019-04-19 01:05:59 +02:00
|
|
|
}
|
|
|
|
|
2019-01-31 17:31:23 +01:00
|
|
|
unsigned String::to_uint(bool& ok) const
|
2018-10-31 19:49:22 +01:00
|
|
|
{
|
|
|
|
unsigned value = 0;
|
2019-12-09 17:45:40 +01:00
|
|
|
for (size_t i = 0; i < length(); ++i) {
|
2018-10-31 19:49:22 +01:00
|
|
|
if (characters()[i] < '0' || characters()[i] > '9') {
|
|
|
|
ok = false;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
value = value * 10;
|
|
|
|
value += characters()[i] - '0';
|
|
|
|
}
|
|
|
|
ok = true;
|
|
|
|
return value;
|
|
|
|
}
|
|
|
|
|
2020-02-05 19:07:53 +01:00
|
|
|
// Formats `value` in decimal using sprintf("%llu") and returns it as a String.
String String::number(unsigned long long value)
{
    char digits[32];
    int written = sprintf(digits, "%llu", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
2020-02-05 19:07:53 +01:00
|
|
|
// Formats `value` in decimal using sprintf("%lu") and returns it as a String.
String String::number(unsigned long value)
{
    char digits[32];
    int written = sprintf(digits, "%lu", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
|
|
|
// Formats `value` in decimal using sprintf("%u") and returns it as a String.
String String::number(unsigned value)
{
    char digits[32];
    int written;
    written = sprintf(digits, "%u", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
2020-02-05 19:07:53 +01:00
|
|
|
// Formats `value` in decimal using sprintf("%lld") and returns it as a String.
String String::number(long long value)
{
    char digits[32];
    int written;
    written = sprintf(digits, "%lld", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
|
|
|
// Formats `value` in decimal using sprintf("%ld") and returns it as a String.
String String::number(long value)
{
    char digits[32];
    int written;
    written = sprintf(digits, "%ld", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
|
|
|
// Formats `value` in decimal using sprintf("%d") and returns it as a String.
String String::number(int value)
{
    char digits[32];
    int written;
    written = sprintf(digits, "%d", value);
    // sprintf() returns the number of characters produced, excluding the terminator.
    return String(digits, written);
}
|
|
|
|
|
2019-01-30 16:28:51 +01:00
|
|
|
// Builds a String from a format string and variadic arguments by handing them
// to StringBuilder::appendvf() and returning the builder's contents.
String String::format(const char* fmt, ...)
{
    va_list args;
    va_start(args, fmt);

    StringBuilder output;
    output.appendvf(fmt, args);

    va_end(args);
    return output.to_string();
}
|
|
|
|
|
2019-06-04 21:53:25 +10:00
|
|
|
bool String::starts_with(const StringView& str) const
|
|
|
|
{
|
|
|
|
if (str.is_empty())
|
|
|
|
return true;
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
if (str.length() > length())
|
|
|
|
return false;
|
2019-07-08 15:38:44 +02:00
|
|
|
return !memcmp(characters(), str.characters_without_null_termination(), str.length());
|
2019-06-04 21:53:25 +10:00
|
|
|
}
|
|
|
|
|
2020-02-15 13:04:00 +13:00
|
|
|
bool String::starts_with(char ch) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
return characters()[0] == ch;
|
|
|
|
}
|
|
|
|
|
2019-06-02 12:26:28 +02:00
|
|
|
bool String::ends_with(const StringView& str) const
|
2019-03-22 12:43:29 +01:00
|
|
|
{
|
|
|
|
if (str.is_empty())
|
|
|
|
return true;
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
if (str.length() > length())
|
|
|
|
return false;
|
2019-07-08 15:38:44 +02:00
|
|
|
return !memcmp(characters() + (length() - str.length()), str.characters_without_null_termination(), str.length());
|
2019-03-22 12:43:29 +01:00
|
|
|
}
|
|
|
|
|
2020-02-15 13:04:00 +13:00
|
|
|
bool String::ends_with(char ch) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
return characters()[length() - 1] == ch;
|
|
|
|
}
|
2019-12-09 17:45:40 +01:00
|
|
|
// Builds a string consisting of `ch` repeated `count` times.
// A count of zero returns empty().
String String::repeated(char ch, size_t count)
{
    if (count == 0)
        return empty();

    // create_uninitialized() hands back the new impl and points `storage` at
    // its character buffer, which is then filled with `ch`.
    char* storage;
    auto impl = StringImpl::create_uninitialized(count, storage);
    memset(storage, ch, count);
    return *impl;
}
|
|
|
|
|
2019-06-02 12:26:28 +02:00
|
|
|
bool String::matches(const StringView& mask, CaseSensitivity case_sensitivity) const
|
2019-05-26 20:36:16 +02:00
|
|
|
{
|
2020-02-26 15:25:24 +08:00
|
|
|
return StringUtils::matches(*this, mask, case_sensitivity);
|
2019-05-26 20:36:16 +02:00
|
|
|
}
|
|
|
|
|
2019-10-28 18:47:48 +01:00
|
|
|
bool String::contains(const String& needle) const
|
|
|
|
{
|
|
|
|
return strstr(characters(), needle.characters());
|
|
|
|
}
|
|
|
|
|
2019-12-18 12:43:53 +01:00
|
|
|
bool String::equals_ignoring_case(const StringView& other) const
|
|
|
|
{
|
|
|
|
if (other.m_impl == impl())
|
|
|
|
return true;
|
|
|
|
if (length() != other.length())
|
|
|
|
return false;
|
|
|
|
for (size_t i = 0; i < length(); ++i) {
|
|
|
|
if (::to_lowercase(characters()[i]) != ::to_lowercase(other.characters_without_null_termination()[i]))
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
return true;
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
2019-10-28 18:47:48 +01:00
|
|
|
|
2020-02-13 08:46:00 +01:00
|
|
|
// Returns a copy of `html` with the characters '<', '>' and '&' replaced by
// the entities "&lt;", "&gt;" and "&amp;". All other characters are copied
// through unchanged.
//
// The replacement literals had been reduced to the raw characters themselves,
// which turned this function into a plain copy that escaped nothing.
String escape_html_entities(const StringView& html)
{
    StringBuilder builder;
    for (size_t i = 0; i < html.length(); ++i) {
        if (html[i] == '<')
            builder.append("&lt;");
        else if (html[i] == '>')
            builder.append("&gt;");
        else if (html[i] == '&')
            builder.append("&amp;");
        else
            builder.append(html[i]);
    }
    return builder.to_string();
}
|
2019-12-30 14:52:04 +01:00
|
|
|
|
2020-02-13 08:46:00 +01:00
|
|
|
}
|