2012-10-08 16:25:58 +04:00
|
|
|
#ifndef utf8_iterator_hh_INCLUDED
|
|
|
|
#define utf8_iterator_hh_INCLUDED
|
|
|
|
|
|
|
|
#include "utf8.hh"
|
|
|
|
|
|
|
|
namespace Kakoune
|
|
|
|
{
|
|
|
|
|
|
|
|
namespace utf8
|
|
|
|
{
|
|
|
|
|
|
|
|
// adapter for an iterator on bytes which permits to iterate
|
|
|
|
// on unicode codepoints instead.
|
2012-10-13 20:31:29 +04:00
|
|
|
template<typename Iterator,
|
2014-07-03 00:14:01 +04:00
|
|
|
typename InvalidPolicy = utf8::InvalidPolicy::Assert>
|
2014-06-24 22:10:57 +04:00
|
|
|
class iterator
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
public:
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator() = default;
|
|
|
|
iterator(Iterator it) : m_it(std::move(it)) {}
|
2012-10-08 16:25:58 +04:00
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator& operator++()
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
2014-07-03 00:14:01 +04:00
|
|
|
m_it = utf8::next(m_it, Iterator{});
|
2012-10-08 16:25:58 +04:00
|
|
|
invalidate_value();
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator operator++(int)
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator save = *this;
|
2012-10-08 16:25:58 +04:00
|
|
|
++*this;
|
|
|
|
return save;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
void advance(CharCount count, const iterator& end)
|
2013-03-06 22:03:43 +04:00
|
|
|
{
|
|
|
|
while (*this != end and count-- > 0)
|
|
|
|
++*this;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator& operator--()
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
2014-07-03 00:14:01 +04:00
|
|
|
m_it = utf8::previous(m_it, Iterator{});
|
2012-10-08 16:25:58 +04:00
|
|
|
invalidate_value();
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator operator--(int)
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator save = *this;
|
2012-10-08 16:25:58 +04:00
|
|
|
--*this;
|
|
|
|
return save;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator operator+(CharCount count) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
if (count < 0)
|
2013-12-03 23:48:53 +04:00
|
|
|
return operator-(-count);
|
2012-10-08 16:25:58 +04:00
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator res = *this;
|
2012-10-08 16:25:58 +04:00
|
|
|
while (count--)
|
|
|
|
++res;
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator operator-(CharCount count) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
if (count < 0)
|
2013-12-03 23:48:53 +04:00
|
|
|
return operator+(-count);
|
2012-10-08 16:25:58 +04:00
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator res = *this;
|
2012-10-08 16:25:58 +04:00
|
|
|
while (count--)
|
|
|
|
--res;
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
bool operator==(const iterator& other) { return m_it == other.m_it; }
|
|
|
|
bool operator!=(const iterator& other) { return m_it != other.m_it; }
|
2012-10-08 16:25:58 +04:00
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
bool operator< (const iterator& other) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
return m_it < other.m_it;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
bool operator<= (const iterator& other) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
return m_it <= other.m_it;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
bool operator> (const iterator& other) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
return m_it > other.m_it;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
bool operator>= (const iterator& other) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
return m_it >= other.m_it;
|
|
|
|
}
|
|
|
|
|
2014-06-24 22:10:57 +04:00
|
|
|
CharCount operator-(iterator other) const
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
2013-04-09 22:04:11 +04:00
|
|
|
//kak_assert(other < *this);
|
2012-10-08 16:25:58 +04:00
|
|
|
check_invariant();
|
|
|
|
other.check_invariant();
|
2012-10-27 15:26:40 +04:00
|
|
|
CharCount dist = 0;
|
2014-05-21 03:25:24 +04:00
|
|
|
while (other.m_it < m_it)
|
2012-10-08 16:25:58 +04:00
|
|
|
{
|
|
|
|
++dist;
|
|
|
|
++other;
|
|
|
|
}
|
|
|
|
return dist;
|
|
|
|
}
|
|
|
|
|
|
|
|
Codepoint operator*() const
|
|
|
|
{
|
|
|
|
return get_value();
|
|
|
|
}
|
|
|
|
|
2013-06-05 21:19:35 +04:00
|
|
|
const Iterator& base() const { return m_it; }
|
|
|
|
Iterator& base() { return m_it; }
|
2012-10-08 16:25:58 +04:00
|
|
|
|
|
|
|
protected:
|
|
|
|
void check_invariant() const
|
|
|
|
{
|
|
|
|
// always point to a character first byte;
|
2013-04-09 22:04:11 +04:00
|
|
|
// kak_assert(is_character_start(it));
|
2012-10-08 16:25:58 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
void invalidate_value() { m_value = -1; }
|
|
|
|
Codepoint get_value() const
|
|
|
|
{
|
|
|
|
if (m_value == -1)
|
2014-07-03 00:14:01 +04:00
|
|
|
m_value = utf8::codepoint<InvalidPolicy>(m_it, Iterator{});
|
2012-10-08 16:25:58 +04:00
|
|
|
return m_value;
|
|
|
|
}
|
|
|
|
|
|
|
|
Iterator m_it;
|
|
|
|
mutable Codepoint m_value = -1;
|
|
|
|
};
|
|
|
|
|
2014-07-03 00:14:01 +04:00
|
|
|
template<typename InvalidPolicy = utf8::InvalidPolicy::Assert, typename Iterator>
|
2014-06-24 22:10:57 +04:00
|
|
|
iterator<Iterator, InvalidPolicy> make_iterator(Iterator it)
|
2013-06-05 21:19:49 +04:00
|
|
|
{
|
2014-06-24 22:10:57 +04:00
|
|
|
return iterator<Iterator, InvalidPolicy>{std::move(it)};
|
2012-10-08 16:25:58 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2013-06-05 21:19:49 +04:00
|
|
|
}
|
2012-10-08 16:25:58 +04:00
|
|
|
#endif // utf8_iterator_hh_INCLUDED
|