2020-01-18 11:38:21 +03:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
|
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions are met:
|
|
|
|
*
|
|
|
|
* 1. Redistributions of source code must retain the above copyright notice, this
|
|
|
|
* list of conditions and the following disclaimer.
|
|
|
|
*
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
* this list of conditions and the following disclaimer in the documentation
|
|
|
|
* and/or other materials provided with the distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
|
|
* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
|
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
|
|
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
|
|
|
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
|
|
|
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
2021-01-15 01:48:01 +03:00
|
|
|
#include <AK/AnyOf.h>
|
2020-02-14 23:41:10 +03:00
|
|
|
#include <AK/ByteBuffer.h>
|
2021-01-15 01:48:01 +03:00
|
|
|
#include <AK/Find.h>
|
2020-04-17 16:04:40 +03:00
|
|
|
#include <AK/FlyString.h>
|
2020-03-08 14:34:33 +03:00
|
|
|
#include <AK/Memory.h>
|
2019-09-06 16:34:26 +03:00
|
|
|
#include <AK/String.h>
|
2019-05-28 12:53:16 +03:00
|
|
|
#include <AK/StringView.h>
|
2020-02-14 23:41:10 +03:00
|
|
|
#include <AK/Vector.h>
|
2019-04-16 03:39:16 +03:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2019-06-09 00:55:13 +03:00
|
|
|
StringView::StringView(const String& string)
|
|
|
|
: m_impl(string.impl())
|
2019-06-03 19:27:56 +03:00
|
|
|
, m_characters(string.characters())
|
2019-06-02 13:19:21 +03:00
|
|
|
, m_length(string.length())
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-03-22 12:12:55 +03:00
|
|
|
StringView::StringView(const FlyString& string)
|
|
|
|
: m_impl(string.impl())
|
|
|
|
, m_characters(string.characters())
|
|
|
|
, m_length(string.length())
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2019-06-29 13:03:28 +03:00
|
|
|
StringView::StringView(const ByteBuffer& buffer)
|
|
|
|
: m_characters((const char*)buffer.data())
|
2020-03-01 14:35:09 +03:00
|
|
|
, m_length(buffer.size())
|
2019-06-29 13:03:28 +03:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2019-09-21 00:43:37 +03:00
|
|
|
Vector<StringView> StringView::split_view(const char separator, bool keep_empty) const
|
2019-04-16 03:39:16 +03:00
|
|
|
{
|
|
|
|
if (is_empty())
|
2019-05-28 12:53:16 +03:00
|
|
|
return {};
|
2019-04-16 03:39:16 +03:00
|
|
|
|
|
|
|
Vector<StringView> v;
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t substart = 0;
|
|
|
|
for (size_t i = 0; i < length(); ++i) {
|
2019-07-08 16:38:44 +03:00
|
|
|
char ch = characters_without_null_termination()[i];
|
2019-04-16 03:39:16 +03:00
|
|
|
if (ch == separator) {
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t sublen = i - substart;
|
2019-09-21 00:43:37 +03:00
|
|
|
if (sublen != 0 || keep_empty)
|
2019-04-16 03:39:16 +03:00
|
|
|
v.append(substring_view(substart, sublen));
|
|
|
|
substart = i + 1;
|
|
|
|
}
|
|
|
|
}
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t taillen = length() - substart;
|
2019-09-21 00:43:37 +03:00
|
|
|
if (taillen != 0 || keep_empty)
|
2019-04-16 03:39:16 +03:00
|
|
|
v.append(substring_view(substart, taillen));
|
|
|
|
return v;
|
|
|
|
}
|
|
|
|
|
2020-05-27 23:21:43 +03:00
|
|
|
Vector<StringView> StringView::split_view(const StringView& separator, bool keep_empty) const
|
|
|
|
{
|
|
|
|
ASSERT(!separator.is_empty());
|
|
|
|
|
|
|
|
if (is_empty())
|
|
|
|
return {};
|
|
|
|
|
|
|
|
StringView view { *this };
|
|
|
|
|
|
|
|
Vector<StringView> parts;
|
|
|
|
|
2021-01-12 23:00:44 +03:00
|
|
|
auto maybe_separator_index = find(separator);
|
2020-05-27 23:21:43 +03:00
|
|
|
while (maybe_separator_index.has_value()) {
|
|
|
|
auto separator_index = maybe_separator_index.value();
|
|
|
|
auto part_with_separator = view.substring_view(0, separator_index + separator.length());
|
|
|
|
if (keep_empty || separator_index > 0)
|
|
|
|
parts.append(part_with_separator.substring_view(0, separator_index));
|
|
|
|
view = view.substring_view_starting_after_substring(part_with_separator);
|
2021-01-12 23:00:44 +03:00
|
|
|
maybe_separator_index = view.find(separator);
|
2020-05-27 23:21:43 +03:00
|
|
|
}
|
|
|
|
if (keep_empty || !view.is_empty())
|
|
|
|
parts.append(view);
|
|
|
|
|
|
|
|
return parts;
|
|
|
|
}
|
|
|
|
|
2019-12-02 15:42:33 +03:00
|
|
|
Vector<StringView> StringView::lines(bool consider_cr) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return {};
|
|
|
|
|
|
|
|
if (!consider_cr)
|
|
|
|
return split_view('\n', true);
|
|
|
|
|
|
|
|
Vector<StringView> v;
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t substart = 0;
|
2019-12-02 15:42:33 +03:00
|
|
|
bool last_ch_was_cr = false;
|
|
|
|
bool split_view = false;
|
2019-12-09 19:45:40 +03:00
|
|
|
for (size_t i = 0; i < length(); ++i) {
|
2019-12-02 15:42:33 +03:00
|
|
|
char ch = characters_without_null_termination()[i];
|
|
|
|
if (ch == '\n') {
|
|
|
|
split_view = true;
|
|
|
|
if (last_ch_was_cr) {
|
|
|
|
substart = i + 1;
|
|
|
|
split_view = false;
|
|
|
|
last_ch_was_cr = false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (ch == '\r') {
|
|
|
|
split_view = true;
|
|
|
|
last_ch_was_cr = true;
|
|
|
|
}
|
|
|
|
if (split_view) {
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t sublen = i - substart;
|
2019-12-02 22:41:15 +03:00
|
|
|
v.append(substring_view(substart, sublen));
|
2019-12-02 15:42:33 +03:00
|
|
|
substart = i + 1;
|
|
|
|
}
|
|
|
|
split_view = false;
|
|
|
|
}
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t taillen = length() - substart;
|
2019-12-02 15:42:33 +03:00
|
|
|
if (taillen != 0)
|
|
|
|
v.append(substring_view(substart, taillen));
|
|
|
|
return v;
|
|
|
|
}
|
|
|
|
|
2020-02-15 00:14:22 +03:00
|
|
|
bool StringView::starts_with(char ch) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
return ch == characters_without_null_termination()[0];
|
|
|
|
}
|
|
|
|
|
2020-07-18 19:59:38 +03:00
|
|
|
bool StringView::starts_with(const StringView& str, CaseSensitivity case_sensitivity) const
|
2019-09-12 14:13:07 +03:00
|
|
|
{
|
2020-07-18 19:59:38 +03:00
|
|
|
return StringUtils::starts_with(*this, str, case_sensitivity);
|
2019-09-12 14:13:07 +03:00
|
|
|
}
|
|
|
|
|
2020-02-15 00:14:22 +03:00
|
|
|
bool StringView::ends_with(char ch) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return false;
|
|
|
|
return ch == characters_without_null_termination()[length() - 1];
|
|
|
|
}
|
|
|
|
|
2020-05-26 13:21:34 +03:00
|
|
|
bool StringView::ends_with(const StringView& str, CaseSensitivity case_sensitivity) const
|
2019-12-29 15:44:30 +03:00
|
|
|
{
|
2020-05-26 13:21:34 +03:00
|
|
|
return StringUtils::ends_with(*this, str, case_sensitivity);
|
2019-12-29 15:44:30 +03:00
|
|
|
}
|
|
|
|
|
2020-10-25 08:34:39 +03:00
|
|
|
bool StringView::matches(const StringView& mask, Vector<MaskSpan>& mask_spans, CaseSensitivity case_sensitivity) const
|
|
|
|
{
|
|
|
|
return StringUtils::matches(*this, mask, case_sensitivity, &mask_spans);
|
|
|
|
}
|
|
|
|
|
2020-02-26 10:25:24 +03:00
|
|
|
bool StringView::matches(const StringView& mask, CaseSensitivity case_sensitivity) const
|
|
|
|
{
|
|
|
|
return StringUtils::matches(*this, mask, case_sensitivity);
|
|
|
|
}
|
|
|
|
|
2020-04-17 16:04:40 +03:00
|
|
|
bool StringView::contains(char needle) const
|
|
|
|
{
|
|
|
|
for (char current : *this) {
|
|
|
|
if (current == needle)
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2020-10-21 00:07:03 +03:00
|
|
|
bool StringView::contains(const StringView& needle, CaseSensitivity case_sensitivity) const
|
2020-07-04 21:04:00 +03:00
|
|
|
{
|
2020-10-21 00:07:03 +03:00
|
|
|
return StringUtils::contains(*this, needle, case_sensitivity);
|
2020-07-04 21:04:00 +03:00
|
|
|
}
|
|
|
|
|
2020-05-13 19:59:31 +03:00
|
|
|
bool StringView::equals_ignoring_case(const StringView& other) const
|
|
|
|
{
|
|
|
|
return StringUtils::equals_ignoring_case(*this, other);
|
|
|
|
}
|
|
|
|
|
2019-12-09 19:45:40 +03:00
|
|
|
StringView StringView::substring_view(size_t start, size_t length) const
|
2019-04-16 03:39:16 +03:00
|
|
|
{
|
|
|
|
ASSERT(start + length <= m_length);
|
|
|
|
return { m_characters + start, length };
|
|
|
|
}
|
2020-09-19 16:19:34 +03:00
|
|
|
StringView StringView::substring_view(size_t start) const
|
|
|
|
{
|
|
|
|
ASSERT(start <= m_length);
|
|
|
|
return { m_characters + start, length() - start };
|
|
|
|
}
|
2019-04-16 03:39:16 +03:00
|
|
|
|
2019-06-13 16:30:55 +03:00
|
|
|
StringView StringView::substring_view_starting_from_substring(const StringView& substring) const
|
|
|
|
{
|
2019-07-08 16:38:44 +03:00
|
|
|
const char* remaining_characters = substring.characters_without_null_termination();
|
2019-06-13 16:30:55 +03:00
|
|
|
ASSERT(remaining_characters >= m_characters);
|
|
|
|
ASSERT(remaining_characters <= m_characters + m_length);
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t remaining_length = m_length - (remaining_characters - m_characters);
|
2019-06-13 16:30:55 +03:00
|
|
|
return { remaining_characters, remaining_length };
|
|
|
|
}
|
|
|
|
|
|
|
|
StringView StringView::substring_view_starting_after_substring(const StringView& substring) const
|
|
|
|
{
|
2019-07-08 16:38:44 +03:00
|
|
|
const char* remaining_characters = substring.characters_without_null_termination() + substring.length();
|
2019-06-13 16:30:55 +03:00
|
|
|
ASSERT(remaining_characters >= m_characters);
|
|
|
|
ASSERT(remaining_characters <= m_characters + m_length);
|
2019-12-09 19:45:40 +03:00
|
|
|
size_t remaining_length = m_length - (remaining_characters - m_characters);
|
2019-06-13 16:30:55 +03:00
|
|
|
return { remaining_characters, remaining_length };
|
|
|
|
}
|
|
|
|
|
2020-12-10 16:17:30 +03:00
|
|
|
template<typename T>
|
|
|
|
Optional<T> StringView::to_int() const
|
2019-08-04 12:44:20 +03:00
|
|
|
{
|
2020-12-10 16:17:30 +03:00
|
|
|
return StringUtils::convert_to_int<T>(*this);
|
2019-08-04 12:44:20 +03:00
|
|
|
}
|
|
|
|
|
2020-12-10 16:17:30 +03:00
|
|
|
template Optional<i8> StringView::to_int() const;
|
|
|
|
template Optional<i16> StringView::to_int() const;
|
|
|
|
template Optional<i32> StringView::to_int() const;
|
|
|
|
template Optional<i64> StringView::to_int() const;
|
|
|
|
|
|
|
|
template<typename T>
|
|
|
|
Optional<T> StringView::to_uint() const
|
2019-04-16 03:39:16 +03:00
|
|
|
{
|
2020-12-10 16:17:30 +03:00
|
|
|
return StringUtils::convert_to_uint<T>(*this);
|
2019-04-16 03:39:16 +03:00
|
|
|
}
|
|
|
|
|
2020-12-10 16:17:30 +03:00
|
|
|
template Optional<u8> StringView::to_uint() const;
|
|
|
|
template Optional<u16> StringView::to_uint() const;
|
|
|
|
template Optional<u32> StringView::to_uint() const;
|
|
|
|
template Optional<u64> StringView::to_uint() const;
|
2021-01-11 21:09:22 +03:00
|
|
|
template Optional<long> StringView::to_uint() const;
|
|
|
|
template Optional<long long> StringView::to_uint() const;
|
2020-12-10 16:17:30 +03:00
|
|
|
|
2019-08-24 23:31:06 +03:00
|
|
|
unsigned StringView::hash() const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return 0;
|
|
|
|
if (m_impl)
|
|
|
|
return m_impl->hash();
|
|
|
|
return string_hash(characters_without_null_termination(), length());
|
|
|
|
}
|
|
|
|
|
2020-03-23 15:45:10 +03:00
|
|
|
bool StringView::operator==(const String& string) const
|
|
|
|
{
|
|
|
|
if (string.is_null())
|
|
|
|
return !m_characters;
|
|
|
|
if (!m_characters)
|
|
|
|
return false;
|
|
|
|
if (m_length != string.length())
|
|
|
|
return false;
|
|
|
|
if (m_characters == string.characters())
|
|
|
|
return true;
|
|
|
|
return !__builtin_memcmp(m_characters, string.characters(), m_length);
|
|
|
|
}
|
|
|
|
|
2020-05-02 21:21:20 +03:00
|
|
|
Optional<size_t> StringView::find_first_of(char c) const
|
|
|
|
{
|
2021-01-15 01:48:01 +03:00
|
|
|
if (const auto location = AK::find(begin(), end(), c); location != end()) {
|
|
|
|
return location.index();
|
2020-05-02 21:21:20 +03:00
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
Optional<size_t> StringView::find_first_of(const StringView& view) const
|
|
|
|
{
|
2021-01-15 01:48:01 +03:00
|
|
|
if (const auto location = AK::find_if(begin(), end(),
|
|
|
|
[&](const auto c) {
|
|
|
|
return AK::any_of(view.begin(), view.end(),
|
|
|
|
[&](const auto view_char) {
|
|
|
|
return c == view_char;
|
|
|
|
});
|
|
|
|
});
|
|
|
|
location != end()) {
|
|
|
|
return location.index();
|
2020-05-02 21:21:20 +03:00
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
Optional<size_t> StringView::find_last_of(char c) const
|
|
|
|
{
|
2020-05-27 23:21:43 +03:00
|
|
|
for (size_t pos = m_length; --pos > 0;) {
|
2020-05-02 21:21:20 +03:00
|
|
|
if (m_characters[pos] == c)
|
|
|
|
return pos;
|
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
Optional<size_t> StringView::find_last_of(const StringView& view) const
|
|
|
|
{
|
|
|
|
for (size_t pos = m_length - 1; --pos > 0;) {
|
|
|
|
char c = m_characters[pos];
|
|
|
|
for (char view_char : view) {
|
|
|
|
if (c == view_char)
|
|
|
|
return pos;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
2021-01-12 22:58:45 +03:00
|
|
|
Optional<size_t> StringView::find(char c) const
|
|
|
|
{
|
|
|
|
return find(StringView { &c, 1 });
|
|
|
|
}
|
|
|
|
|
|
|
|
Optional<size_t> StringView::find(const StringView& view) const
|
|
|
|
{
|
|
|
|
return StringUtils::find(*this, view);
|
|
|
|
}
|
|
|
|
|
2020-05-06 19:53:05 +03:00
|
|
|
String StringView::to_string() const { return String { *this }; }
|
|
|
|
|
2019-04-16 03:39:16 +03:00
|
|
|
}
|