/* * Copyright (c) 2018-2021, Andreas Kling * Copyright (c) 2023, Liav A. * * SPDX-License-Identifier: BSD-2-Clause */ #include #include #include #include #include #include #include #include #ifndef KERNEL # include # include # include #endif namespace AK { inline ErrorOr StringBuilder::will_append(size_t size) { if (m_use_inline_capacity_only == UseInlineCapacityOnly::Yes) { VERIFY(m_buffer.capacity() == StringBuilder::inline_capacity); Checked current_pointer = m_buffer.size(); current_pointer += size; VERIFY(!current_pointer.has_overflow()); if (current_pointer <= StringBuilder::inline_capacity) { return {}; } return Error::from_errno(ENOMEM); } Checked needed_capacity = m_buffer.size(); needed_capacity += size; VERIFY(!needed_capacity.has_overflow()); // Prefer to completely use the existing capacity first if (needed_capacity <= m_buffer.capacity()) return {}; Checked expanded_capacity = needed_capacity; expanded_capacity *= 2; VERIFY(!expanded_capacity.has_overflow()); TRY(m_buffer.try_ensure_capacity(expanded_capacity.value())); return {}; } ErrorOr StringBuilder::create(size_t initial_capacity) { StringBuilder builder; TRY(builder.m_buffer.try_ensure_capacity(initial_capacity)); return builder; } StringBuilder::StringBuilder(size_t initial_capacity) { m_buffer.ensure_capacity(initial_capacity); } StringBuilder::StringBuilder(UseInlineCapacityOnly use_inline_capacity_only) : m_use_inline_capacity_only(use_inline_capacity_only) { } size_t StringBuilder::length() const { return m_buffer.size(); } bool StringBuilder::is_empty() const { return m_buffer.is_empty(); } void StringBuilder::trim(size_t count) { auto decrease_count = min(m_buffer.size(), count); m_buffer.resize(m_buffer.size() - decrease_count); } ErrorOr StringBuilder::try_append(StringView string) { if (string.is_empty()) return {}; TRY(will_append(string.length())); TRY(m_buffer.try_append(string.characters_without_null_termination(), string.length())); return {}; } ErrorOr StringBuilder::try_append(char ch) { TRY(will_append(1)); TRY(m_buffer.try_append(ch)); return {}; } ErrorOr StringBuilder::try_append_repeated(char ch, size_t n) { TRY(will_append(n)); for (size_t i = 0; i < n; ++i) TRY(try_append(ch)); return {}; } void StringBuilder::append(StringView string) { MUST(try_append(string)); } ErrorOr StringBuilder::try_append(char const* characters, size_t length) { return try_append(StringView { characters, length }); } void StringBuilder::append(char const* characters, size_t length) { MUST(try_append(characters, length)); } void StringBuilder::append(char ch) { MUST(try_append(ch)); } void StringBuilder::appendvf(char const* fmt, va_list ap) { printf_internal([this](char*&, char ch) { append(ch); }, nullptr, fmt, ap); } void StringBuilder::append_repeated(char ch, size_t n) { MUST(try_append_repeated(ch, n)); } ErrorOr StringBuilder::to_byte_buffer() const { return ByteBuffer::copy(data(), length()); } #ifndef KERNEL ByteString StringBuilder::to_byte_string() const { if (is_empty()) return ByteString::empty(); return ByteString((char const*)data(), length()); } ErrorOr StringBuilder::to_string() const { return String::from_utf8(string_view()); } String StringBuilder::to_string_without_validation() const { return String::from_utf8_without_validation(string_view().bytes()); } FlyString StringBuilder::to_fly_string_without_validation() const { return FlyString::from_utf8_without_validation(string_view().bytes()); } ErrorOr StringBuilder::to_fly_string() const { return FlyString::from_utf8(string_view()); } #endif u8* StringBuilder::data() { return m_buffer.data(); } u8 const* StringBuilder::data() const { return m_buffer.data(); } StringView StringBuilder::string_view() const { return StringView { data(), m_buffer.size() }; } void StringBuilder::clear() { m_buffer.clear(); } ErrorOr StringBuilder::try_append_code_point(u32 code_point) { auto nwritten = TRY(AK::UnicodeUtils::try_code_point_to_utf8(code_point, [this](char c) { return try_append(c); })); if (nwritten < 0) { TRY(try_append(0xef)); TRY(try_append(0xbf)); TRY(try_append(0xbd)); } return {}; } void StringBuilder::append_code_point(u32 code_point) { if (code_point <= 0x7f) { m_buffer.append(static_cast(code_point)); } else if (code_point <= 0x07ff) { (void)will_append(2); m_buffer.append(static_cast((((code_point >> 6) & 0x1f) | 0xc0))); m_buffer.append(static_cast((((code_point >> 0) & 0x3f) | 0x80))); } else if (code_point <= 0xffff) { (void)will_append(3); m_buffer.append(static_cast((((code_point >> 12) & 0x0f) | 0xe0))); m_buffer.append(static_cast((((code_point >> 6) & 0x3f) | 0x80))); m_buffer.append(static_cast((((code_point >> 0) & 0x3f) | 0x80))); } else if (code_point <= 0x10ffff) { (void)will_append(4); m_buffer.append(static_cast((((code_point >> 18) & 0x07) | 0xf0))); m_buffer.append(static_cast((((code_point >> 12) & 0x3f) | 0x80))); m_buffer.append(static_cast((((code_point >> 6) & 0x3f) | 0x80))); m_buffer.append(static_cast((((code_point >> 0) & 0x3f) | 0x80))); } else { (void)will_append(3); m_buffer.append(0xef); m_buffer.append(0xbf); m_buffer.append(0xbd); } } #ifndef KERNEL ErrorOr StringBuilder::try_append(Utf16View const& utf16_view) { // NOTE: This may under-allocate in the presence of surrogate pairs. // That's okay, appending will still grow the buffer as needed. TRY(will_append(utf16_view.length_in_code_units())); for (size_t i = 0; i < utf16_view.length_in_code_units();) { // OPTIMIZATION: Fast path for ASCII characters. auto code_unit = utf16_view.data()[i]; if (code_unit <= 0x7f) { append(static_cast(code_unit)); ++i; continue; } auto code_point = utf16_view.code_point_at(i); TRY(try_append_code_point(code_point)); i += (code_point > 0xffff ? 2 : 1); } return {}; } void StringBuilder::append(Utf16View const& utf16_view) { MUST(try_append(utf16_view)); } #endif ErrorOr StringBuilder::try_append(Utf32View const& utf32_view) { for (size_t i = 0; i < utf32_view.length(); ++i) { auto code_point = utf32_view.code_points()[i]; TRY(try_append_code_point(code_point)); } return {}; } void StringBuilder::append(Utf32View const& utf32_view) { MUST(try_append(utf32_view)); } void StringBuilder::append_as_lowercase(char ch) { if (ch >= 'A' && ch <= 'Z') append(ch + 0x20); else append(ch); } void StringBuilder::append_escaped_for_json(StringView string) { MUST(try_append_escaped_for_json(string)); } ErrorOr StringBuilder::try_append_escaped_for_json(StringView string) { for (auto ch : string) { switch (ch) { case '\b': TRY(try_append("\\b"sv)); break; case '\n': TRY(try_append("\\n"sv)); break; case '\t': TRY(try_append("\\t"sv)); break; case '\"': TRY(try_append("\\\""sv)); break; case '\\': TRY(try_append("\\\\"sv)); break; default: if (ch >= 0 && ch <= 0x1f) TRY(try_appendff("\\u{:04x}", ch)); else TRY(try_append(ch)); } } return {}; } }