blob: 464aff3a8d72e0b228b77712defde87ba3dfa298 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
|
#ifndef utf8_iterator_hh_INCLUDED
#define utf8_iterator_hh_INCLUDED
#include "utf8.hh"
namespace Kakoune
{
namespace utf8
{
// Adapter around an iterator on bytes which allows iterating
// on unicode codepoints instead.
//
// Iterator is the underlying byte iterator type. InvalidPolicy is
// forwarded to utf8::codepoint whenever a codepoint gets decoded.
template<typename Iterator,
         typename InvalidPolicy = InvalidBytePolicy::Assert>
class utf8_iterator
{
public:
    utf8_iterator() = default;

    // Wrap the given byte iterator (implicit conversion is kept on
    // purpose so existing callers passing a raw Iterator still work).
    utf8_iterator(Iterator it) : m_it(std::move(it)) {}

    // Move forward by one codepoint, as computed by utf8::next.
    utf8_iterator& operator++()
    {
        m_it = utf8::next(m_it);
        invalidate_value();
        return *this;
    }

    utf8_iterator operator++(int)
    {
        utf8_iterator save = *this;
        ++*this;
        return save;
    }

    // Move backward by one codepoint, as computed by utf8::previous.
    utf8_iterator& operator--()
    {
        m_it = utf8::previous(m_it);
        invalidate_value();
        return *this;
    }

    utf8_iterator operator--(int)
    {
        utf8_iterator save = *this;
        --*this;
        return save;
    }

    // Return an iterator moved by count codepoints; a negative count
    // moves backward. Done one codepoint at a time.
    utf8_iterator operator+(CharCount count) const
    {
        if (count < 0)
            return operator-(-count);

        utf8_iterator res = *this;
        while (count--)
            ++res;
        return res;
    }

    // Return an iterator moved back by count codepoints; a negative
    // count moves forward. Done one codepoint at a time.
    utf8_iterator operator-(CharCount count) const
    {
        if (count < 0)
            return operator+(-count);

        utf8_iterator res = *this;
        while (count--)
            --res;
        return res;
    }

    // Comparisons are delegated to the underlying byte iterators.
    // All of them are const so that they can be used on const iterators.
    bool operator==(const utf8_iterator& other) const { return m_it == other.m_it; }
    bool operator!=(const utf8_iterator& other) const { return m_it != other.m_it; }

    bool operator< (const utf8_iterator& other) const
    {
        return m_it < other.m_it;
    }

    bool operator<= (const utf8_iterator& other) const
    {
        return m_it <= other.m_it;
    }

    bool operator> (const utf8_iterator& other) const
    {
        return m_it > other.m_it;
    }

    bool operator>= (const utf8_iterator& other) const
    {
        return m_it >= other.m_it;
    }

    // Number of codepoints between other and *this, obtained by
    // advancing a copy of other until it reaches *this.
    //
    // Precondition (not checked): *this must be reachable from other
    // by moving forward, otherwise the loop never meets its exit
    // condition.
    CharCount operator-(utf8_iterator other) const
    {
        //assert(other < *this);
        check_invariant();
        other.check_invariant();
        CharCount dist = 0;
        while (other.m_it != m_it)
        {
            ++dist;
            ++other;
        }
        return dist;
    }

    // Codepoint at the current position; decoded on first use and
    // cached until the iterator moves.
    Codepoint operator*() const
    {
        return get_value();
    }

    const Iterator& underlying_iterator() const { return m_it; }

    // Mutable access to the wrapped byte iterator. The cached codepoint
    // is dropped because the caller may reposition the iterator through
    // the returned reference. A reference kept around and modified after
    // a later dereference is still not tracked.
    Iterator& underlying_iterator()
    {
        invalidate_value();
        return m_it;
    }

protected:
    // Placeholder for consistency checks; currently performs no check.
    void check_invariant() const
    {
        // always point to a character first byte;
        // assert(is_character_start(it));
    }

private:
    // -1 marks the cached codepoint as "not decoded yet".
    void invalidate_value() { m_value = -1; }

    // Decode the codepoint at m_it if it is not cached yet, then return it.
    Codepoint get_value() const
    {
        if (m_value == -1)
            m_value = utf8::codepoint<InvalidPolicy>(m_it);
        return m_value;
    }

    Iterator m_it;
    // mutable so that the const operator*() can fill the cache.
    mutable Codepoint m_value = -1;
};
}
}
#endif // utf8_iterator_hh_INCLUDED
|