2011-09-21 18:37:09 +04:00
|
|
|
#include "selectors.hh"
|
|
|
|
|
2012-08-29 23:49:36 +04:00
|
|
|
#include "string.hh"
|
2012-10-08 21:12:09 +04:00
|
|
|
#include "utf8_iterator.hh"
|
|
|
|
|
2011-09-21 23:09:49 +04:00
|
|
|
#include <algorithm>
|
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
#include <boost/optional.hpp>
|
|
|
|
|
2011-09-21 18:37:09 +04:00
|
|
|
namespace Kakoune
|
|
|
|
{
|
|
|
|
|
2012-10-13 20:31:29 +04:00
|
|
|
// Codepoint-level iterator used by the selectors below: a utf8_iterator
// wrapping a BufferIterator, instantiated with utf8::InvalidBytePolicy::Pass.
using Utf8Iterator = utf8::utf8_iterator<BufferIterator, utf8::InvalidBytePolicy::Pass>;
|
2012-10-08 21:12:09 +04:00
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
|
|
|
|
template<bool punctuation_is_word = false>
|
2012-10-08 21:12:09 +04:00
|
|
|
bool is_word(Codepoint c)
|
2011-09-21 18:37:09 +04:00
|
|
|
{
|
2012-09-30 18:23:18 +04:00
|
|
|
return Kakoune::is_word(c);
|
2011-09-21 18:37:09 +04:00
|
|
|
}
|
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
template<>
|
2012-10-08 21:12:09 +04:00
|
|
|
bool is_word<true>(Codepoint c)
|
2012-03-07 23:20:32 +04:00
|
|
|
{
|
|
|
|
return !is_blank(c) and !is_eol(c);
|
|
|
|
}
|
|
|
|
|
2012-10-08 21:12:09 +04:00
|
|
|
// A codepoint is punctuation when it is neither a word character, a blank
// nor an end of line.
static bool is_punctuation(Codepoint c)
{
    if (is_word(c))
        return false;
    if (is_blank(c))
        return false;
    return not is_eol(c);
}
|
|
|
|
|
2011-09-23 13:17:19 +04:00
|
|
|
// Coarse class of a codepoint, as computed by categorize().
enum class CharCategories
{
    Blank,        // codepoints accepted by is_blank
    EndOfLine,    // codepoints accepted by is_eol
    Word,         // word characters (optionally including punctuation)
    Punctuation,  // everything else
};
|
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
template<bool punctuation_is_word = false>
|
2012-10-08 21:12:09 +04:00
|
|
|
CharCategories categorize(Codepoint c)
|
2011-09-23 13:17:19 +04:00
|
|
|
{
|
|
|
|
if (is_word(c))
|
|
|
|
return CharCategories::Word;
|
2011-09-26 03:50:13 +04:00
|
|
|
if (is_eol(c))
|
|
|
|
return CharCategories::EndOfLine;
|
2011-09-23 13:17:19 +04:00
|
|
|
if (is_blank(c))
|
|
|
|
return CharCategories::Blank;
|
2012-03-07 23:20:32 +04:00
|
|
|
return punctuation_is_word ? CharCategories::Word
|
|
|
|
: CharCategories::Punctuation;
|
2011-09-23 13:17:19 +04:00
|
|
|
}
|
|
|
|
|
2012-10-08 21:12:09 +04:00
|
|
|
bool is_begin(const BufferIterator& it) { return it.is_begin(); }
|
|
|
|
bool is_end(const BufferIterator& it) { return it.is_end(); }
|
|
|
|
|
|
|
|
// Boundary tests for utf8 iterators: delegate to the wrapped buffer iterator.
bool is_begin(const Utf8Iterator& it)
{
    const auto& base = it.underlying_iterator();
    return base.is_begin();
}

bool is_end(const Utf8Iterator& it)
{
    const auto& base = it.underlying_iterator();
    return base.is_end();
}
|
|
|
|
|
|
|
|
// Advance `it` while it is not at the end and `condition` holds for the
// element it designates. `it` is modified in place.
template<typename Iterator, typename T>
void skip_while(Iterator& it, T condition)
{
    for (;;)
    {
        if (is_end(it))
            return;
        if (not condition(*it))
            return;
        ++it;
    }
}
|
|
|
|
|
2012-10-08 21:12:09 +04:00
|
|
|
// Move `it` backward while it is not at the beginning and `condition` holds
// for the element it designates. Note that the loop can stop at the beginning
// on an element that still satisfies `condition`.
template<typename Iterator, typename T>
void skip_while_reverse(Iterator& it, T condition)
{
    for (;;)
    {
        if (is_begin(it))
            return;
        if (not condition(*it))
            return;
        --it;
    }
}
|
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
// Build a Range from two utf8 iterators by unwrapping their underlying
// buffer iterators.
Range utf8_range(const Utf8Iterator& first, const Utf8Iterator& last)
{
    const auto& range_first = first.underlying_iterator();
    const auto& range_last = last.underlying_iterator();
    return Range{range_first, range_last};
}
|
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
}
|
|
|
|
|
2012-05-03 11:25:13 +04:00
|
|
|
// Iterator over successive regex matches in a BufferIterator range.
using RegexIterator = boost::regex_iterator<BufferIterator>;
|
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
template<bool punctuation_is_word>
|
2012-11-30 21:32:49 +04:00
|
|
|
Selection select_to_next_word(const Selection& selection)
|
2011-09-21 18:37:09 +04:00
|
|
|
{
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator begin = selection.last();
|
2012-03-07 23:20:32 +04:00
|
|
|
if (categorize<punctuation_is_word>(*begin) !=
|
|
|
|
categorize<punctuation_is_word>(*(begin+1)))
|
2011-09-23 13:17:19 +04:00
|
|
|
++begin;
|
2011-09-26 03:50:13 +04:00
|
|
|
|
|
|
|
skip_while(begin, is_eol);
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator end = begin+1;
|
2011-09-23 13:17:19 +04:00
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
if (not punctuation_is_word and is_punctuation(*begin))
|
2011-09-22 18:00:31 +04:00
|
|
|
skip_while(end, is_punctuation);
|
2012-03-07 23:20:32 +04:00
|
|
|
else if (is_word<punctuation_is_word>(*begin))
|
|
|
|
skip_while(end, is_word<punctuation_is_word>);
|
2011-09-23 13:17:19 +04:00
|
|
|
|
2013-01-03 17:30:14 +04:00
|
|
|
skip_while(end, is_blank);
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
return utf8_range(begin, end-1);
|
2011-09-21 18:37:09 +04:00
|
|
|
}
|
2012-11-30 21:32:49 +04:00
|
|
|
template Selection select_to_next_word<false>(const Selection&);
|
|
|
|
template Selection select_to_next_word<true>(const Selection&);
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
template<bool punctuation_is_word>
|
2012-11-30 21:32:49 +04:00
|
|
|
Selection select_to_next_word_end(const Selection& selection)
|
2011-09-21 18:37:09 +04:00
|
|
|
{
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator begin = selection.last();
|
2012-03-07 23:20:32 +04:00
|
|
|
if (categorize<punctuation_is_word>(*begin) !=
|
|
|
|
categorize<punctuation_is_word>(*(begin+1)))
|
2011-09-23 13:17:19 +04:00
|
|
|
++begin;
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2011-09-26 03:50:13 +04:00
|
|
|
skip_while(begin, is_eol);
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator end = begin;
|
2011-09-22 18:00:31 +04:00
|
|
|
skip_while(end, is_blank);
|
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
if (not punctuation_is_word and is_punctuation(*end))
|
2013-01-03 17:30:14 +04:00
|
|
|
skip_while(end, is_punctuation);
|
2012-03-07 23:20:32 +04:00
|
|
|
else if (is_word<punctuation_is_word>(*end))
|
2013-01-03 17:30:14 +04:00
|
|
|
skip_while(end, is_word<punctuation_is_word>);
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
return utf8_range(begin, end-1);
|
2011-09-21 18:37:09 +04:00
|
|
|
}
|
2012-11-30 21:32:49 +04:00
|
|
|
template Selection select_to_next_word_end<false>(const Selection&);
|
|
|
|
template Selection select_to_next_word_end<true>(const Selection&);
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
template<bool punctuation_is_word>
|
2012-11-30 21:32:49 +04:00
|
|
|
Selection select_to_previous_word(const Selection& selection)
|
2011-09-21 18:37:09 +04:00
|
|
|
{
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator begin = selection.last();
|
2011-09-23 13:17:19 +04:00
|
|
|
|
2012-03-07 23:20:32 +04:00
|
|
|
if (categorize<punctuation_is_word>(*begin) !=
|
|
|
|
categorize<punctuation_is_word>(*(begin-1)))
|
2011-09-23 13:17:19 +04:00
|
|
|
--begin;
|
2011-09-21 18:37:09 +04:00
|
|
|
|
2011-09-26 03:50:13 +04:00
|
|
|
skip_while_reverse(begin, is_eol);
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator end = begin;
|
2011-09-22 18:00:31 +04:00
|
|
|
skip_while_reverse(end, is_blank);
|
2011-09-23 13:17:19 +04:00
|
|
|
|
2011-11-24 22:46:35 +04:00
|
|
|
bool with_end = false;
|
2012-03-07 23:20:32 +04:00
|
|
|
if (not punctuation_is_word and is_punctuation(*end))
|
2013-01-03 17:30:14 +04:00
|
|
|
{
|
|
|
|
skip_while_reverse(end, is_punctuation);
|
|
|
|
with_end = is_punctuation(*end);
|
|
|
|
}
|
2012-03-07 23:20:32 +04:00
|
|
|
else if (is_word<punctuation_is_word>(*end))
|
2013-01-03 17:30:14 +04:00
|
|
|
{
|
|
|
|
skip_while_reverse(end, is_word<punctuation_is_word>);
|
|
|
|
with_end = is_word<punctuation_is_word>(*end);
|
|
|
|
}
|
2011-10-25 22:46:14 +04:00
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
return utf8_range(begin, with_end ? end : end+1);
|
2011-10-25 22:46:14 +04:00
|
|
|
}
|
2012-11-30 21:32:49 +04:00
|
|
|
template Selection select_to_previous_word<false>(const Selection&);
|
|
|
|
template Selection select_to_previous_word<true>(const Selection&);
|
2011-10-25 22:46:14 +04:00
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select the line containing the cursor (selection.last()), from its first
// codepoint to its terminating '\n'. When the cursor is already on a '\n'
// that is not the last character of the buffer, the following line is
// selected instead.
Selection select_line(const Selection& selection)
{
    Utf8Iterator line_begin = selection.last();
    const bool on_newline = (*line_begin == '\n');
    if (on_newline and not is_end(line_begin + 1))
        ++line_begin;

    // walk back until the previous codepoint is a line terminator
    for (;;)
    {
        if (is_begin(line_begin))
            break;
        if (*(line_begin - 1) == '\n')
            break;
        --line_begin;
    }

    // walk forward to the line terminator, never stepping onto the end
    Utf8Iterator line_end = line_begin;
    for (;;)
    {
        if (is_end(line_end + 1))
            break;
        if (*line_end == '\n')
            break;
        ++line_end;
    }
    return utf8_range(line_begin, line_end);
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Find the first bracket character at or after the cursor on the current
// line and select from it to its matching counterpart, honouring nesting.
// Returns the selection unchanged when no bracket or no match is found.
Selection select_matching(const Selection& selection)
{
    // openers sit at even indices, each immediately followed by its closer
    const std::vector<Codepoint> pairs = { '(', ')', '{', '}', '[', ']', '<', '>' };

    Utf8Iterator cursor = selection.last();
    auto found = pairs.end();
    for (; not is_eol(*cursor); ++cursor)
    {
        found = std::find(pairs.begin(), pairs.end(), *cursor);
        if (found != pairs.end())
            break;
    }
    if (found == pairs.end())
        return selection;

    const Utf8Iterator anchor = cursor;
    const bool on_opener = ((found - pairs.begin()) % 2) == 0;
    int depth = 0;

    if (on_opener)
    {
        // scan forward for the closer that brings the depth back to zero
        const Codepoint opener = *found;
        const Codepoint closer = *(found+1);
        for (; not is_end(cursor); ++cursor)
        {
            if (*cursor == opener)
                ++depth;
            else if (*cursor == closer)
            {
                if (--depth == 0)
                    return utf8_range(anchor, cursor);
            }
        }
    }
    else
    {
        // scan backward for the opener that brings the depth back to zero
        const Codepoint opener = *(found-1);
        const Codepoint closer = *found;
        for (;;)
        {
            if (*cursor == closer)
                ++depth;
            else if (*cursor == opener)
            {
                if (--depth == 0)
                    return utf8_range(anchor, cursor);
            }
            if (is_begin(cursor))
                break;
            --cursor;
        }
    }
    return selection;
}
|
|
|
|
|
2013-04-22 16:18:49 +04:00
|
|
|
// std::optional is not available to us yet (it was standardized in C++17), so we use boost::optional until then
|
|
|
|
using boost::optional;
|
|
|
|
// Locate the `matching` delimiters around pos.
//
// flags selects which side(s) are searched (ToBegin and/or ToEnd) and, with
// Inner, excludes the delimiters themselves from the result. When ToEnd is
// not requested the returned range runs from pos back to the opening side.
// Returns an empty optional when a requested delimiter cannot be found.
static optional<Range> find_surrounding(const BufferIterator& pos,
                                        const CodepointPair& matching,
                                        ObjectFlags flags)
{
    const bool to_begin = flags & ObjectFlags::ToBegin;
    const bool to_end = flags & ObjectFlags::ToEnd;
    // nesting levels are only tracked when the two delimiters differ
    const bool nestable = matching.first != matching.second;

    Utf8Iterator opening = pos;
    if (to_begin)
    {
        int depth = 0;
        for (; not is_begin(opening); --opening)
        {
            // a closing delimiter under the cursor itself does not open a
            // nested level
            if (nestable and opening != pos and *opening == matching.second)
                ++depth;
            else if (*opening == matching.first)
            {
                if (depth == 0)
                    break;
                --depth;
            }
        }
        const bool found = depth == 0 and *opening == matching.first;
        if (not found)
            return optional<Range>{};
    }

    Utf8Iterator closing = pos;
    if (to_end)
    {
        int depth = 0;
        for (closing = opening + 1; not is_end(closing); ++closing)
        {
            if (nestable and *closing == matching.first)
                ++depth;
            else if (*closing == matching.second)
            {
                if (depth == 0)
                    break;
                --depth;
            }
        }
        const bool found = depth == 0 and *closing == matching.second;
        if (not found)
            return optional<Range>{};
    }

    if (flags & ObjectFlags::Inner)
    {
        if (to_begin)
            ++opening;
        // keep at least one position when the delimiters are adjacent
        if (to_end and opening != closing)
            --closing;
    }

    if (to_end)
        return utf8_range(opening, closing);
    return utf8_range(closing, opening);
}
|
|
|
|
|
|
|
|
// Select the text surrounded by the `matching` delimiters around the cursor.
// If the whole object is requested, the delimiters are distinct and the
// result equals the current selection (in either direction), the search is
// repeated from just past the result so that the next enclosing pair is
// selected. Returns the selection unchanged when nothing is found.
Selection select_surrounding(const Selection& selection,
                             const CodepointPair& matching,
                             ObjectFlags flags)
{
    auto res = find_surrounding(selection.last(), matching, flags);
    if (not res)
        return selection;

    const bool whole_object = flags == (ObjectFlags::ToBegin | ObjectFlags::ToEnd);
    const bool nestable = matching.first != matching.second;
    if (not whole_object or not nestable or res->last().is_end())
        return *res;

    const bool already_selected =
        *res == selection or Range{res->last(), res->first()} == selection;
    if (not already_selected)
        return *res;

    res = find_surrounding(res->last() + 1, matching, flags);
    return res ? Selection{*res} : selection;
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select from the cursor to the count-th next occurrence of c, including
// that occurrence only when `inclusive` is set. Returns the selection
// unchanged when the end of the buffer is reached first.
Selection select_to(const Selection& selection,
                    Codepoint c, int count, bool inclusive)
{
    const Utf8Iterator origin = selection.last();
    Utf8Iterator target = origin;
    const auto differs_from_c = [c](Codepoint cur) { return cur != c; };

    for (;;)
    {
        ++target;
        skip_while(target, differs_from_c);
        if (is_end(target))
            return selection;
        if (--count <= 0)
            break;
    }

    return utf8_range(origin, inclusive ? target : target-1);
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select backward from the cursor to the count-th previous occurrence of c,
// including that occurrence only when `inclusive` is set. Returns the
// selection unchanged when fewer than `count` occurrences precede the cursor.
Selection select_to_reverse(const Selection& selection,
                            Codepoint c, int count, bool inclusive)
{
    Utf8Iterator begin = selection.last();
    Utf8Iterator end = begin;
    do
    {
        // nothing lies before the buffer start, so do not step back from it
        if (is_begin(end))
            return selection;
        --end;
        skip_while_reverse(end, [c](Codepoint cur) { return cur != c; });
        // skip_while_reverse stops either on an occurrence of c or on the
        // buffer start; an occurrence located exactly at the buffer start is
        // still a valid match, so test the character rather than the position
        if (*end != c)
            return selection;
    }
    while (--count > 0);

    return utf8_range(begin, inclusive ? end : end+1);
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select from the cursor up to, but not including, the next end of line
// found after the cursor.
Selection select_to_eol(const Selection& selection)
{
    const Utf8Iterator origin = selection.last();
    const auto not_eol = [](Codepoint cur) { return not is_eol(cur); };

    Utf8Iterator line_end = origin + 1;
    skip_while(line_end, not_eol);
    return utf8_range(origin, line_end-1);
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select backward from the cursor to the first codepoint following the
// previous end of line, or to the buffer start when the scan reaches it.
Selection select_to_eol_reverse(const Selection& selection)
{
    const Utf8Iterator origin = selection.last();
    const auto not_eol = [](Codepoint cur) { return not is_eol(cur); };

    Utf8Iterator line_start = origin - 1;
    skip_while_reverse(line_start, not_eol);
    if (is_begin(line_start))
        return utf8_range(origin, line_start);
    return utf8_range(origin, line_start+1);
}
|
|
|
|
|
2012-03-12 18:23:30 +04:00
|
|
|
template<bool punctuation_is_word>
|
2013-05-15 16:24:09 +04:00
|
|
|
Selection select_whole_word(const Selection& selection, ObjectFlags flags)
|
2012-03-12 18:23:30 +04:00
|
|
|
{
|
2012-10-08 21:12:09 +04:00
|
|
|
Utf8Iterator first = selection.last();
|
|
|
|
Utf8Iterator last = first;
|
2013-05-15 16:24:09 +04:00
|
|
|
if (is_word<punctuation_is_word>(*first))
|
2012-03-12 18:23:30 +04:00
|
|
|
{
|
2013-05-15 16:24:09 +04:00
|
|
|
if (flags & ObjectFlags::ToBegin)
|
|
|
|
{
|
|
|
|
skip_while_reverse(first, is_word<punctuation_is_word>);
|
|
|
|
if (not is_word<punctuation_is_word>(*first))
|
|
|
|
++first;
|
|
|
|
}
|
|
|
|
if (flags & ObjectFlags::ToEnd)
|
|
|
|
{
|
|
|
|
skip_while(last, is_word<punctuation_is_word>);
|
|
|
|
if (not (flags & ObjectFlags::Inner))
|
|
|
|
skip_while(last, is_blank);
|
|
|
|
--last;
|
|
|
|
}
|
2012-03-12 18:23:30 +04:00
|
|
|
}
|
2013-05-15 16:24:09 +04:00
|
|
|
else if (not (flags & ObjectFlags::Inner))
|
2012-03-12 18:23:30 +04:00
|
|
|
{
|
2013-05-15 16:24:09 +04:00
|
|
|
if (flags & ObjectFlags::ToBegin)
|
|
|
|
{
|
|
|
|
skip_while_reverse(first, is_blank);
|
|
|
|
if (not is_word<punctuation_is_word>(*first))
|
|
|
|
return selection;
|
|
|
|
skip_while_reverse(first, is_word<punctuation_is_word>);
|
|
|
|
if (not is_word<punctuation_is_word>(*first))
|
|
|
|
++first;
|
|
|
|
}
|
|
|
|
if (flags & ObjectFlags::ToEnd)
|
|
|
|
{
|
|
|
|
skip_while(last, is_blank);
|
|
|
|
--last;
|
|
|
|
}
|
2012-03-12 18:23:30 +04:00
|
|
|
}
|
2013-05-15 16:24:09 +04:00
|
|
|
return (flags & ObjectFlags::ToEnd) ? utf8_range(first, last)
|
|
|
|
: utf8_range(last, first);
|
2012-03-12 18:23:30 +04:00
|
|
|
}
|
2013-05-15 16:24:09 +04:00
|
|
|
template Selection select_whole_word<false>(const Selection&, ObjectFlags);
|
|
|
|
template Selection select_whole_word<true>(const Selection&, ObjectFlags);
|
2012-03-12 18:23:30 +04:00
|
|
|
|
2013-05-15 16:24:09 +04:00
|
|
|
// Select the sentence around the cursor (selection.last()).
//
// A sentence is delimited by one of '.', ';', '!', '?' or by an empty line
// (two consecutive ends of line). flags: ToBegin / ToEnd choose which side(s)
// to extend to; without Inner, the blanks following the terminator are
// included. The scan is done on raw buffer characters.
Selection select_whole_sentence(const Selection& selection, ObjectFlags flags)
{
    const auto ends_sentence = [](char ch) {
        return ch == '.' or ch == ';' or ch == '!' or ch == '?';
    };

    BufferIterator first = selection.last();
    BufferIterator last = first;

    if (flags & ObjectFlags::ToBegin)
    {
        bool saw_non_blank = false;
        while (not is_begin(first))
        {
            char cur = *first;
            char prev = *(first-1);
            if (not is_blank(cur))
                saw_non_blank = true;
            if (is_eol(prev) and is_eol(cur))
            {
                // empty line: the sentence starts right after it
                ++first;
                break;
            }
            else if (ends_sentence(prev))
            {
                if (saw_non_blank)
                    break;
                // Only blanks were crossed so far: the cursor was in the
                // blanks trailing the previous sentence, so that sentence is
                // the one to select; its terminator becomes the end anchor.
                else if (flags & ObjectFlags::ToEnd)
                    last = first-1;
            }
            --first;
        }
        skip_while(first, is_blank);
    }
    if (flags & ObjectFlags::ToEnd)
    {
        while (not is_end(last))
        {
            char cur = *last;
            // Stop on a terminator, or on an end of line that is followed by
            // the buffer end or by another end of line. The next character
            // must be read with *(last+1); *last+1 would add one to the
            // current character's value instead.
            if (ends_sentence(cur) or
                (is_eol(cur) and (is_end(last+1) or is_eol(*(last+1)))))
                break;
            ++last;
        }
        if (not (flags & ObjectFlags::Inner) and not is_end(last))
        {
            // include the blanks following the terminator
            ++last;
            skip_while(last, is_blank);
            --last;
        }
    }
    return (flags & ObjectFlags::ToEnd) ? Selection{first, last}
                                        : Selection{last, first};
}
|
|
|
|
|
2013-05-15 16:24:09 +04:00
|
|
|
// Select the paragraph around the cursor (selection.last()), paragraphs
// being separated by empty lines (two consecutive ends of line).
//
// flags: ToBegin / ToEnd choose which side(s) to extend to; without Inner,
// the ends of line following the paragraph are included. The scan is done on
// raw buffer characters.
Selection select_whole_paragraph(const Selection& selection, ObjectFlags flags)
{
    const bool to_begin = flags & ObjectFlags::ToBegin;
    const bool to_end = flags & ObjectFlags::ToEnd;
    const bool inner = flags & ObjectFlags::Inner;

    BufferIterator para_begin = selection.last();
    BufferIterator para_end = para_begin;

    if (to_begin and not is_begin(para_begin))
    {
        // step back over the ends of line under/before the cursor first
        skip_while_reverse(para_begin, is_eol);
        if (to_end)
            para_end = para_begin;

        for (; not is_begin(para_begin); --para_begin)
        {
            const char cur = *para_begin;
            const char prev = *(para_begin-1);
            if (is_eol(prev) and is_eol(cur))
            {
                // empty line: the paragraph starts right after it
                ++para_begin;
                break;
            }
        }
    }
    if (to_end)
    {
        for (; not is_end(para_end); ++para_end)
        {
            const char cur = *para_end;
            const char prev = *(para_end-1);
            if (is_eol(cur) and is_eol(prev))
            {
                if (not inner)
                    skip_while(para_end, is_eol);
                --para_end;
                break;
            }
        }
    }

    if (to_end)
        return Selection{para_begin, para_end};
    return Selection{para_end, para_begin};
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Extend both ends of the selection to line boundaries: the earlier end is
// moved back to the start of its line and the later end forward to the next
// end of line. The orientation of the selection is preserved.
Selection select_whole_lines(const Selection& selection)
{
    // no need to be utf8 aware for is_eol as we only use \n as line separator
    BufferIterator first = selection.first();
    BufferIterator last = selection.last();

    // alias whichever end comes first / last in the buffer
    const bool forward = first <= last;
    BufferIterator& line_start = forward ? first : last;
    BufferIterator& line_end = forward ? last : first;

    const auto not_eol = [](char cur) { return not is_eol(cur); };

    --line_start;
    skip_while_reverse(line_start, not_eol);
    // the backward scan stopped on the previous line's terminator, unless it
    // was stopped by the buffer start
    if (is_eol(*line_start))
        ++line_start;

    skip_while(line_end, not_eol);

    return Selection(first, last);
}
|
|
|
|
|
2013-04-16 16:30:11 +04:00
|
|
|
// Shrink the selection so that it does not start in the middle of a line:
// the earlier end is advanced until it is at the buffer start or right after
// a '\n', and the later end is moved back until the character following it
// is a '\n' (or until it meets the earlier end). The orientation of the
// selection is preserved.
Selection trim_partial_lines(const Selection& selection)
{
    // raw buffer iterators are enough here: only '\n' is searched for
    BufferIterator first = selection.first();
    BufferIterator last = selection.last();

    // alias whichever end comes first / last in the buffer
    const bool forward = first <= last;
    BufferIterator& line_start = forward ? first : last;
    BufferIterator& line_end = forward ? last : first;

    for (;;)
    {
        if (is_begin(line_start) or *(line_start-1) == '\n')
            break;
        ++line_start;
    }

    for (;;)
    {
        if (not (*(line_end+1) != '\n' and line_end != line_start))
            break;
        --line_end;
    }

    return Selection(first, last);
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Select everything from the start of the buffer to its last character
// (the position preceding buffer.end()).
Selection select_whole_buffer(const Selection& selection)
{
    const Buffer& buffer = selection.first().buffer();
    const auto buffer_start = buffer.begin();
    const auto last_char = utf8::previous(buffer.end());
    return Selection(buffer_start, last_char);
}
|
|
|
|
|
2013-01-08 21:46:45 +04:00
|
|
|
// Match results of a boost regex search run over a BufferIterator range.
using MatchResults = boost::match_results<BufferIterator>;
|
|
|
|
|
|
|
|
// Search [begin, end) repeatedly, each time restarting after the previous
// match, and leave the last match found in `res`. The loop stops early on a
// match that ends where the search started, to avoid looping forever.
// Returns whether `res` holds a match on exit.
static bool find_last_match(BufferIterator begin, const BufferIterator& end,
                            MatchResults& res, const Regex& regex)
{
    MatchResults candidate;
    for (;;)
    {
        if (not boost::regex_search(begin, end, candidate, regex))
            break;

        const BufferIterator match_end = candidate[0].second;
        if (begin == match_end)
            break;

        begin = match_end;
        res.swap(candidate);
    }
    return not res.empty();
}
|
|
|
|
|
|
|
|
template<bool forward>
|
|
|
|
bool find_match_in_buffer(const BufferIterator pos, MatchResults& matches,
|
|
|
|
const Regex& ex)
|
|
|
|
{
|
|
|
|
auto bufbeg = pos.buffer().begin();
|
|
|
|
auto bufend = pos.buffer().end();
|
|
|
|
|
|
|
|
if (forward)
|
|
|
|
return (boost::regex_search(pos, bufend, matches, ex) or
|
|
|
|
boost::regex_search(bufbeg, pos, matches, ex));
|
|
|
|
else
|
|
|
|
return (find_last_match(bufbeg, pos, matches, ex) or
|
|
|
|
find_last_match(pos, bufend, matches, ex));
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
template<bool forward>
|
2013-04-05 21:28:08 +04:00
|
|
|
Selection select_next_match(const Selection& selection, const Regex& regex)
|
2011-11-21 23:08:51 +04:00
|
|
|
{
|
2013-04-05 21:28:08 +04:00
|
|
|
// regex matching do not use Utf8Iterator as boost::regex handle utf8
|
|
|
|
// decoding itself
|
|
|
|
BufferIterator begin = selection.last();
|
|
|
|
BufferIterator end = begin;
|
|
|
|
CaptureList captures;
|
2012-09-12 21:09:10 +04:00
|
|
|
|
2013-04-05 21:28:08 +04:00
|
|
|
MatchResults matches;
|
2012-03-05 00:11:22 +04:00
|
|
|
|
2013-04-05 21:28:08 +04:00
|
|
|
if (find_match_in_buffer<forward>(utf8::next(begin), matches, regex))
|
2011-11-21 23:08:51 +04:00
|
|
|
{
|
2013-04-05 21:28:08 +04:00
|
|
|
begin = matches[0].first;
|
|
|
|
end = matches[0].second;
|
|
|
|
for (auto& match : matches)
|
|
|
|
captures.push_back(String(match.first, match.second));
|
2011-11-21 23:08:51 +04:00
|
|
|
}
|
2013-04-05 21:28:08 +04:00
|
|
|
else
|
|
|
|
throw runtime_error("'" + regex.str() + "': no matches found");
|
|
|
|
|
|
|
|
if (begin == end)
|
|
|
|
++end;
|
|
|
|
|
|
|
|
end = utf8::previous(end);
|
|
|
|
if (not forward)
|
|
|
|
std::swap(begin, end);
|
|
|
|
return Selection{begin, end, std::move(captures)};
|
2011-11-21 23:08:51 +04:00
|
|
|
}
|
2013-04-05 21:28:08 +04:00
|
|
|
template Selection select_next_match<true>(const Selection&, const Regex&);
|
|
|
|
template Selection select_next_match<false>(const Selection&, const Regex&);
|
2011-11-21 23:08:51 +04:00
|
|
|
|
2013-04-05 21:28:08 +04:00
|
|
|
// Return one selection per match of `regex` inside `selection`, each
// carrying the capture groups of its match. A match starting at the end of
// the selection is ignored.
SelectionList select_all_matches(const Selection& selection, const Regex& regex)
{
    SelectionList result;

    const RegexIterator no_more_matches;
    for (RegexIterator it(selection.begin(), selection.end(), regex);
         it != no_more_matches; ++it)
    {
        const auto& found = *it;
        BufferIterator match_begin = found[0].first;
        BufferIterator match_end = found[0].second;

        if (match_begin == selection.end())
            continue;

        CaptureList captures;
        for (auto& sub_match : found)
            captures.push_back(String(sub_match.first, sub_match.second));

        // selections are inclusive, so step back onto the last matched
        // character unless the match is empty
        result.push_back(Selection(match_begin,
                                   match_begin == match_end ? match_end
                                                            : utf8::previous(match_end),
                                   std::move(captures)));
    }
    return result;
}
|
|
|
|
|
2012-11-30 21:32:49 +04:00
|
|
|
// Split `selection` on the matches of `regex`: return the pieces of text
// lying between consecutive matches, plus the piece following the last
// match. Sub-expressions are not captured (match_nosubs).
SelectionList split_selection(const Selection& selection,
                              const Regex& regex)
{
    SelectionList result;
    BufferIterator piece_begin = selection.begin();

    const RegexIterator no_more_matches;
    for (RegexIterator it(selection.begin(), selection.end(), regex,
                          boost::regex_constants::match_nosubs);
         it != no_more_matches; ++it)
    {
        BufferIterator separator_begin = (*it)[0].first;

        // selections are inclusive, so end on the character before the
        // separator unless the piece is empty
        result.push_back(Selection(piece_begin,
                                   (piece_begin == separator_begin)
                                       ? separator_begin
                                       : utf8::previous(separator_begin)));
        piece_begin = (*it)[0].second;
    }

    // remaining text up to the later end of the selection
    result.push_back(Selection(piece_begin, std::max(selection.first(),
                                                     selection.last())));
    return result;
}
|
|
|
|
|
2011-09-21 18:37:09 +04:00
|
|
|
}
|