From c06f4ac6f58261c079721b54058989d7695ef9c3 Mon Sep 17 00:00:00 2001
From: Sam Atkins <atkinssj@serenityos.org>
Date: Tue, 28 Feb 2023 11:11:39 +0000
Subject: [PATCH] AK+Everywhere: Make GenericLexer::ignore_until() stop before
 the value

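`consume_until(foo)` stops before foo, and so does
`ignore_until(Predicate)`. Make the `ignore_until(char)` and
`ignore_until(char const*)` overloads consistent with that, so they
are less confusing: they now stop before the stop value instead of
skipping past it. Callers that relied on the old behavior now call
`ignore()` explicitly afterwards.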
---
 AK/GenericLexer.h                                   |  5 +----
 .../Lagom/Tools/CodeGenerators/IPCCompiler/main.cpp |  2 +-
 Tests/AK/TestGenericLexer.cpp                       |  4 ++--
 Userland/Libraries/LibCpp/Preprocessor.cpp          | 13 ++++++++-----
 Userland/Libraries/LibWeb/MimeSniff/MimeType.cpp    |  5 +----
 5 files changed, 13 insertions(+), 16 deletions(-)
diff --git a/AK/GenericLexer.h b/AK/GenericLexer.h
index 508c4df3a29..d37af0608d2 100644
--- a/AK/GenericLexer.h
+++ b/AK/GenericLexer.h
@@ -142,7 +142,6 @@ public:
         while (!is_eof() && peek() != stop) {
             ++m_index;
         }
-        ignore();
     }
 
     constexpr void ignore_until(char const* stop)
@@ -150,7 +149,6 @@ public:
         while (!is_eof() && !next_is(stop)) {
             ++m_index;
         }
-        ignore(__builtin_strlen(stop));
     }
 
     /*
@@ -205,8 +203,7 @@ public:
             ++m_index;
     }
 
-    // Ignore characters until `pred` return true
-    // We don't skip the stop character as it may not be a unique value
+    // Ignore characters until `pred` returns true
     template<typename TPredicate>
     constexpr void ignore_until(TPredicate pred)
     {
diff --git a/Meta/Lagom/Tools/CodeGenerators/IPCCompiler/main.cpp b/Meta/Lagom/Tools/CodeGenerators/IPCCompiler/main.cpp
index e6a988bafee..f03f5a571b4 100644
--- a/Meta/Lagom/Tools/CodeGenerators/IPCCompiler/main.cpp
+++ b/Meta/Lagom/Tools/CodeGenerators/IPCCompiler/main.cpp
@@ -105,7 +105,7 @@ Vector<Endpoint> parse(ByteBuffer const& file_contents)
     auto consume_whitespace = [&lexer] {
         lexer.ignore_while([](char ch) { return isspace(ch); });
         if (lexer.peek() == '/' && lexer.peek(1) == '/')
-            lexer.ignore_until([](char ch) { return ch == '\n'; });
+            lexer.ignore_until('\n');
     };
 
     auto parse_parameter = [&](Vector<Parameter>& storage) {
diff --git a/Tests/AK/TestGenericLexer.cpp b/Tests/AK/TestGenericLexer.cpp
index 86e2383ed54..39cb03d2784 100644
--- a/Tests/AK/TestGenericLexer.cpp
+++ b/Tests/AK/TestGenericLexer.cpp
@@ -107,7 +107,7 @@ TEST_CASE(should_constexpr_ignore_until)
         sut.ignore_until('d');
         return sut;
     }();
-    static_assert(sut.peek() == 'e');
+    static_assert(sut.peek() == 'd');
 }
 
 TEST_CASE(should_constexpr_ignore_until_cstring)
@@ -117,7 +117,7 @@ TEST_CASE(should_constexpr_ignore_until_cstring)
         sut.ignore_until("cde");
         return sut;
     }();
-    static_assert(sut.peek() == 'f');
+    static_assert(sut.peek() == 'c');
 }
 
 TEST_CASE(should_constexpr_next_is_pred)
diff --git a/Userland/Libraries/LibCpp/Preprocessor.cpp b/Userland/Libraries/LibCpp/Preprocessor.cpp
index a5b3815e565..128b215b158 100644
--- a/Userland/Libraries/LibCpp/Preprocessor.cpp
+++ b/Userland/Libraries/LibCpp/Preprocessor.cpp
@@ -72,21 +72,24 @@ static void consume_whitespace(GenericLexer& lexer)
                 lexer.ignore(2);
             } else {
                 lexer.ignore_until('\n');
+                lexer.ignore();
                 break;
             }
         }
     };
     for (;;) {
-        if (lexer.consume_specific("//"sv))
+        if (lexer.consume_specific("//"sv)) {
             ignore_line();
-        else if (lexer.consume_specific("/*"sv))
+        } else if (lexer.consume_specific("/*"sv)) {
             lexer.ignore_until("*/");
-        else if (lexer.next_is("\\\n"sv))
             lexer.ignore(2);
-        else if (lexer.is_eof() || !lexer.next_is(isspace))
+        } else if (lexer.next_is("\\\n"sv)) {
+            lexer.ignore(2);
+        } else if (lexer.is_eof() || !lexer.next_is(isspace)) {
             break;
-        else
+        } else {
             lexer.ignore();
+        }
     }
 }
 
diff --git a/Userland/Libraries/LibWeb/MimeSniff/MimeType.cpp b/Userland/Libraries/LibWeb/MimeSniff/MimeType.cpp
index b138a6e4126..3b4a3ae1ca3 100644
--- a/Userland/Libraries/LibWeb/MimeSniff/MimeType.cpp
+++ b/Userland/Libraries/LibWeb/MimeSniff/MimeType.cpp
@@ -139,10 +139,7 @@ Optional<MimeType> MimeType::from_string(StringView string)
             parameter_value = Fetch::Infrastructure::collect_an_http_quoted_string(lexer, Fetch::Infrastructure::HttpQuotedStringExtractValue::Yes);
 
             // 2. Collect a sequence of code points that are not U+003B (;) from input, given position.
-            // NOTE: This uses the predicate version as the ignore_until(char) version will also ignore the ';'.
-            lexer.ignore_until([](char ch) {
-                return ch == ';';
-            });
+            lexer.ignore_until(';');
         }
 
         // 9. Otherwise: