2021-04-22 06:19:39 +03:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2021, the SerenityOS developers.
|
|
|
|
*
|
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
|
|
*/
|
|
|
|
|
2021-04-25 08:53:23 +03:00
|
|
|
#include <LibTest/TestCase.h>
|
2021-04-22 06:19:39 +03:00
|
|
|
|
|
|
|
#include <AK/GenericLexer.h>
|
|
|
|
#include <AK/StringView.h>
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_construct_from_empty_string_view)
|
|
|
|
{
|
|
|
|
constexpr GenericLexer sut(StringView {});
|
|
|
|
static_assert(sut.is_eof());
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_construct_from_string_view)
|
|
|
|
{
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(!sut.is_eof());
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_tell)
|
|
|
|
{
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(sut.tell() == 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_tell_remaining)
|
|
|
|
{
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(sut.tell_remaining() == 6);
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_peek)
|
|
|
|
{
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(sut.peek() == 'a');
|
|
|
|
static_assert(sut.peek(2) == 'c');
|
|
|
|
static_assert(sut.peek(100) == '\0');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_next_is)
|
|
|
|
{
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(sut.next_is('a'));
|
|
|
|
static_assert(sut.next_is("abc"));
|
2021-07-04 12:08:46 +03:00
|
|
|
static_assert(sut.next_is("abc"sv));
|
2021-04-22 06:19:39 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_retreat)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.consume();
|
|
|
|
sut.retreat();
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'a');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_consume_1)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.consume();
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'b');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_consume_specific_char)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.consume_specific('a');
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'b');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_consume_specific_string_view)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
|
|
|
sut.consume_specific("ab"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'c');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_consume_specific_cstring)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.consume_specific("abcd");
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'e');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_ignore_until)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.ignore_until('d');
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'e');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_ignore_until_cstring)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.ignore_until("cde");
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'f');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_next_is_pred)
|
|
|
|
{
|
|
|
|
constexpr auto pred = [](auto c) {
|
|
|
|
return c == 'a';
|
|
|
|
};
|
2021-07-04 12:08:46 +03:00
|
|
|
constexpr GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
static_assert(sut.next_is(pred));
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_ignore_while_pred)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
|
|
|
constexpr auto pred = [](auto c) {
|
|
|
|
return c == 'a';
|
|
|
|
};
|
|
|
|
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.ignore_while(pred);
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'b');
|
|
|
|
}
|
|
|
|
|
|
|
|
TEST_CASE(should_constexpr_ignore_until_pred)
|
|
|
|
{
|
|
|
|
constexpr auto sut = [] {
|
|
|
|
constexpr auto pred = [](auto c) {
|
|
|
|
return c == 'c';
|
|
|
|
};
|
|
|
|
|
2021-07-04 12:08:46 +03:00
|
|
|
GenericLexer sut("abcdef"sv);
|
2021-04-22 06:19:39 +03:00
|
|
|
sut.ignore_until(pred);
|
|
|
|
return sut;
|
|
|
|
}();
|
|
|
|
static_assert(sut.peek() == 'c');
|
|
|
|
}
|
2021-08-18 05:20:04 +03:00
|
|
|
|
|
|
|
TEST_CASE(consume_escaped_code_point)
|
|
|
|
{
|
|
|
|
auto test = [](StringView test, Result<u32, GenericLexer::UnicodeEscapeError> expected, bool combine_surrogate_pairs = true) {
|
|
|
|
GenericLexer lexer(test);
|
|
|
|
|
|
|
|
auto actual = lexer.consume_escaped_code_point(combine_surrogate_pairs);
|
|
|
|
EXPECT_EQ(actual.is_error(), expected.is_error());
|
|
|
|
|
|
|
|
if (actual.is_error() && expected.is_error())
|
|
|
|
EXPECT_EQ(actual.error(), expected.error());
|
|
|
|
else
|
|
|
|
EXPECT_EQ(actual.value(), expected.value());
|
|
|
|
};
|
|
|
|
|
|
|
|
test("\\u"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u{"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u{1"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u{}"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u{x}"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
|
|
|
|
test("\\u{110000}"sv, GenericLexer::UnicodeEscapeError::UnicodeEscapeOverflow);
|
|
|
|
test("\\u{f00000000}"sv, GenericLexer::UnicodeEscapeError::UnicodeEscapeOverflow);
|
|
|
|
|
|
|
|
test("\\u{0}"sv, 0);
|
|
|
|
test("\\u{41}"sv, 0x41);
|
|
|
|
test("\\u{ffff}"sv, 0xffff);
|
|
|
|
test("\\u{10ffff}"sv, 0x10ffff);
|
|
|
|
|
|
|
|
test("\\u1"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u11"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u111"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\u111x"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\ud800\\u"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\ud800\\u1"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\ud800\\u11"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\ud800\\u111"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
test("\\ud800\\u111x"sv, GenericLexer::UnicodeEscapeError::MalformedUnicodeEscape);
|
|
|
|
|
|
|
|
test("\\u0000"sv, 0x0);
|
|
|
|
test("\\u0041"sv, 0x41);
|
|
|
|
test("\\uffff"sv, 0xffff);
|
|
|
|
|
|
|
|
test("\\ud83d"sv, 0xd83d);
|
|
|
|
test("\\ud83d\\u1111"sv, 0xd83d);
|
|
|
|
test("\\ud83d\\ude00"sv, 0x1f600);
|
|
|
|
test("\\ud83d\\ude00"sv, 0xd83d, false);
|
|
|
|
}
|