27#ifndef UTF8_FOR_CPP_UNCHECKED_H_2675DCD0_9480_4c0c_B92A_CC14C027B731
28#define UTF8_FOR_CPP_UNCHECKED_H_2675DCD0_9480_4c0c_B92A_CC14C027B731
32namespace utf8::unchecked
// Encodes the code point `cp` as UTF-8 and writes the resulting octets
// through `result`.
//
// This is the unchecked variant: `cp` is not validated in any way, so
// surrogate values and values outside the Unicode range are encoded as-is
// using the same bit layout.
//
// @param cp      code point to encode
// @param result  output iterator receiving between one and four octets
// @return        `result` advanced past the last octet written
template <typename octet_iterator>
octet_iterator append(uint32_t cp, octet_iterator result)
{
    if (cp < 0x80) {
        // One octet: 0xxxxxxx
        *(result++) = static_cast<uint8_t>(cp);
    }
    else if (cp < 0x800) {
        // Two octets: 110xxxxx 10xxxxxx
        *(result++) = static_cast<uint8_t>((cp >> 6) | 0xc0);
        *(result++) = static_cast<uint8_t>((cp & 0x3f) | 0x80);
    }
    else if (cp < 0x10000) {
        // Three octets: 1110xxxx 10xxxxxx 10xxxxxx
        *(result++) = static_cast<uint8_t>((cp >> 12) | 0xe0);
        *(result++) = static_cast<uint8_t>(((cp >> 6) & 0x3f) | 0x80);
        *(result++) = static_cast<uint8_t>((cp & 0x3f) | 0x80);
    }
    else {
        // Four octets: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
        *(result++) = static_cast<uint8_t>((cp >> 18) | 0xf0);
        *(result++) = static_cast<uint8_t>(((cp >> 12) & 0x3f) | 0x80);
        *(result++) = static_cast<uint8_t>(((cp >> 6) & 0x3f) | 0x80);
        *(result++) = static_cast<uint8_t>((cp & 0x3f) | 0x80);
    }
    return result;
}
// Decodes a code point from the octet sequence at `it` and returns it.
//
// The lead octet is read through utf8::internal::mask8 and the sequence
// length is obtained from utf8::internal::sequence_length(it). The visible
// assignments then merge bits from following octets into `cp`.
//
// `it` is taken by non-const reference.
// NOTE(review): the iterator increments, the selection between the
// assignments below and the final return are not visible in this extract —
// confirm against the full file before relying on how far `it` is advanced.
55 template <
typename octet_iterator>
56 uint32_t next(octet_iterator& it)
58 uint32_t cp = utf8::internal::mask8(*it);
59 typename std::iterator_traits<octet_iterator>::difference_type length = utf8::internal::sequence_length(it);
// 11-bit value: low 5 bits of the lead octet (shifted to bits 6..10) plus the
// low 6 bits of the octet currently at `it`.
65 cp = ((cp << 6) & 0x7ff) + ((*it) & 0x3f);
// 16-bit value so far: low 4 bits of the lead octet (bits 12..15) plus the
// low 6 bits of the octet at `it` placed in bits 6..11.
69 cp = ((cp << 12) & 0xffff) + ((utf8::internal::mask8(*it) << 6) & 0xfff);
// 21-bit value so far: low 3 bits of the lead octet (bits 18..20) plus the
// low 6 bits of the octet at `it` placed in bits 12..17.
75 cp = ((cp << 18) & 0x1fffff) + ((utf8::internal::mask8(*it) << 12) & 0x3ffff);
// Adds the low 6 bits of the octet at `it` in bits 6..11.
77 cp += (utf8::internal::mask8(*it) << 6) & 0xfff;
// Returns whatever utf8::unchecked::next yields for the sequence at `it`.
// `it` is received by value, so the caller's iterator is left untouched.
86 template <
typename octet_iterator>
87 uint32_t peek_next(octet_iterator it)
89 return utf8::unchecked::next(it);
// Moves `it` backwards and returns the code point decoded at the position
// where it stops.
//
// `it` is pre-decremented at least once and keeps being decremented while
// utf8::internal::is_trail reports the octet it points at as a trail octet.
// Decoding is done on a copy, so on return `it` stays at that position.
//
// The signature carries no range start, so the loop cannot stop at the
// beginning of a buffer by itself.
92 template <
typename octet_iterator>
93 uint32_t prior(octet_iterator& it)
95 while (utf8::internal::is_trail(*(--it))) {
// Decode from a copy so that `it` is not moved forward again.
98 octet_iterator temp = it;
99 return utf8::unchecked::next(temp);
// Forwards to utf8::unchecked::prior(it) and returns its result unchanged.
// NOTE(review): presumably kept as an alternative name for prior — confirm
// whether callers should prefer one over the other.
103 template <
typename octet_iterator>
104 inline uint32_t previous(octet_iterator& it)
106 return utf8::unchecked::prior(it);
// Calls utf8::unchecked::next(it) `n` times, discarding the decoded values.
//
// The counter starts at 0 and runs while it is less than `n`, so a zero or
// negative `n` results in no calls; moving backwards is not handled here.
109 template <
typename octet_iterator,
typename distance_type>
110 void advance(octet_iterator& it, distance_type n)
112 for (distance_type i = 0; i < n; ++i) {
113 utf8::unchecked::next(it);
// Counts how many times utf8::unchecked::next has to be applied to `first`
// while `first < last` holds.
//
// The loop condition uses operator<, so octet_iterator must support it.
// NOTE(review): the return statement is not visible in this extract;
// presumably `dist` is returned — confirm against the full file.
117 template <
typename octet_iterator>
118 typename std::iterator_traits<octet_iterator>::difference_type distance(octet_iterator first, octet_iterator last)
120 typename std::iterator_traits<octet_iterator>::difference_type dist;
121 for (dist = 0; first < last; ++dist) {
122 utf8::unchecked::next(first);
// Converts the 16-bit units in [start, end) to UTF-8, writing the octets
// through `result` via utf8::unchecked::append.
//
// Each unit is read through utf8::internal::mask16. When
// utf8::internal::is_lead_surrogate accepts the unit, a second unit is read
// and both are combined into one code point before it is appended.
127 template <
typename u16bit_iterator,
typename octet_iterator>
128 octet_iterator utf16to8(u16bit_iterator start, u16bit_iterator end, octet_iterator result)
130 while (start != end) {
131 uint32_t cp = utf8::internal::mask16(*start++);
133 if (utf8::internal::is_lead_surrogate(cp)) {
// NOTE(review): no comparison of `start` against `end` is visible before
// this read; if the input ends with a lead surrogate this would dereference
// `end` — confirm that callers guarantee well-formed input.
134 uint32_t trail_surrogate = utf8::internal::mask16(*start++);
// Combine lead and trail units; internal::SURROGATE_OFFSET is defined
// outside this view.
135 cp = (cp << 10) + trail_surrogate + internal::SURROGATE_OFFSET;
137 result = utf8::unchecked::append(cp, result);
// Converts the UTF-8 octets in [start, end) to 16-bit units written through
// `result`.
//
// Code points are decoded with utf8::unchecked::next while `start < end`,
// so octet_iterator must support operator<. A decoded code point is written
// either as two units (the first two stores below) or as a single unit
// (the last store).
// NOTE(review): the condition choosing between the two forms is not visible
// in this extract — confirm against the full file.
142 template <
typename u16bit_iterator,
typename octet_iterator>
143 u16bit_iterator utf8to16(octet_iterator start, octet_iterator end, u16bit_iterator result)
145 while (start < end) {
146 uint32_t cp = utf8::unchecked::next(start);
// First unit of the pair: upper bits of cp plus internal::LEAD_OFFSET.
148 *result++ =
static_cast<uint16_t
>((cp >> 10) + internal::LEAD_OFFSET);
// Second unit of the pair: low 10 bits of cp plus
// internal::TRAIL_SURROGATE_MIN.
149 *result++ =
static_cast<uint16_t
>((cp & 0x3ff) + internal::TRAIL_SURROGATE_MIN);
// Single-unit form: cp narrowed to 16 bits.
151 *result++ =
static_cast<uint16_t
>(cp);
// Converts the 32-bit values in [start, end) to UTF-8 by passing each one to
// utf8::unchecked::append, which writes through `result`.
//
// The loop compares with `!=`; `result` is replaced by the iterator returned
// from each append call.
157 template <
typename octet_iterator,
typename u32bit_iterator>
158 octet_iterator utf32to8(u32bit_iterator start, u32bit_iterator end, octet_iterator result)
160 while (start != end) {
161 result = utf8::unchecked::append(*(start++), result);
// Converts the UTF-8 octets in [start, end) to 32-bit values: each value
// returned by utf8::unchecked::next(start) is written through `result`.
//
// The loop runs while `start < end`, so octet_iterator must support
// operator<.
167 template <
typename octet_iterator,
typename u32bit_iterator>
168 u32bit_iterator utf8to32(octet_iterator start, octet_iterator end, u32bit_iterator result)
170 while (start < end) {
171 (*result++) = utf8::unchecked::next(start);
178 template <
typename octet_iterator>
184 using iterator_category = std::bidirectional_iterator_tag;
185 using value_type = uint32_t;
186 using difference_type = std::ptrdiff_t;
187 using pointer = uint32_t*;
188 using reference = uint32_t&;
190 iterator() =
default;
191 explicit iterator(octet_iterator
const & octet_it) : it(octet_it) { }
193 octet_iterator base()
const
198 uint32_t operator*()
const
200 octet_iterator temp = it;
201 return utf8::unchecked::next(temp);
204 bool operator==(iterator
const & rhs)
const
206 return (it == rhs.it);
209 bool operator!=(iterator
const & rhs)
const
211 return !(operator==(rhs));
214 iterator& operator++()
216 std::advance(it, utf8::internal::sequence_length(it));
220 iterator operator++(
int)
222 iterator temp = *
this;
223 std::advance(it, utf8::internal::sequence_length(it));
227 iterator& operator--()
229 utf8::unchecked::prior(it);
233 iterator operator--(
int)
235 iterator temp = *
this;
236 utf8::unchecked::prior(it);