28#ifndef UTF8_FOR_CPP_UNCHECKED_H_2675DCD0_9480_4c0c_B92A_CC14C027B731
29#define UTF8_FOR_CPP_UNCHECKED_H_2675DCD0_9480_4c0c_B92A_CC14C027B731
37 template <
typename octet_iterator>
43 template <
typename word_iterator>
49 template <
typename octet_iterator,
typename output_iterator>
52 while (start != end) {
53 octet_iterator sequence_start = start;
57 for (octet_iterator it = sequence_start; it != start; ++it)
82 template <
typename octet_iterator,
typename output_iterator>
83 inline output_iterator
replace_invalid(octet_iterator start, octet_iterator end, output_iterator out)
92 replace_invalid(s.begin(), s.end(), std::back_inserter(result), replacement);
103 template <
typename octet_iterator>
112 cp = ((cp << 6) & 0x7ff) + ((*it) & 0x3f);
118 cp =
static_cast<utfchar32_t>(cp + ((*it) & 0x3f));
126 cp =
static_cast<utfchar32_t>(cp + ((*it) & 0x3f));
133 template <
typename octet_iterator>
139 template <
typename word_iterator>
148 template <
typename octet_iterator>
152 octet_iterator temp = it;
156 template <
typename octet_iterator,
typename distance_type>
157 void advance(octet_iterator& it, distance_type n)
159 const distance_type zero(0);
162 for (distance_type i = n; i < zero; ++i)
166 for (distance_type i = zero; i < n; ++i)
171 template <
typename octet_iterator>
172 typename std::iterator_traits<octet_iterator>::difference_type
173 distance(octet_iterator first, octet_iterator last)
175 typename std::iterator_traits<octet_iterator>::difference_type dist;
176 for (dist = 0; first < last; ++dist)
181 template <
typename u16bit_iterator,
typename octet_iterator>
182 octet_iterator
utf16to8(u16bit_iterator start, u16bit_iterator end, octet_iterator result)
184 while (start != end) {
198 template <
typename u16bit_iterator,
typename octet_iterator>
199 u16bit_iterator
utf8to16(octet_iterator start, octet_iterator end, u16bit_iterator result)
201 while (start < end) {
213 template <
typename octet_iterator,
typename u32bit_iterator>
214 octet_iterator
utf32to8(u32bit_iterator start, u32bit_iterator end, octet_iterator result)
222 template <
typename octet_iterator,
typename u32bit_iterator>
223 u32bit_iterator
utf8to32(octet_iterator start, octet_iterator end, u32bit_iterator result)
232 template <
typename octet_iterator>
242 explicit iterator (
const octet_iterator& octet_it): it(octet_it) {}
244 octet_iterator
base ()
const {
return it; }
247 octet_iterator temp = it;
252 return (it == rhs.it);
iterator(const octet_iterator &octet_it)
bool operator!=(const iterator &rhs) const
octet_iterator base() const
std::ptrdiff_t difference_type
utfchar32_t operator*() const
bool operator==(const iterator &rhs) const
std::bidirectional_iterator_tag iterator_category
bool is_lead_surrogate(utfchar32_t cp)
octet_iterator append(utfchar32_t cp, octet_iterator result)
const utfchar32_t SURROGATE_OFFSET
utfchar8_t mask8(octet_type oc)
utfchar16_t mask16(u16_type oc)
word_iterator append16(utfchar32_t cp, word_iterator result)
bool is_trail(octet_type oc)
utf_error validate_next(octet_iterator &it, octet_iterator end, utfchar32_t &code_point)
int sequence_length(octet_iterator lead_it)
const utfchar16_t TRAIL_SURROGATE_MIN
const utfchar16_t LEAD_OFFSET
octet_iterator append(utfchar32_t cp, octet_iterator result)
utfchar32_t next16(word_iterator &it)
void advance(octet_iterator &it, distance_type n)
word_iterator append16(utfchar32_t cp, word_iterator result)
u32bit_iterator utf8to32(octet_iterator start, octet_iterator end, u32bit_iterator result)
utfchar32_t prior(octet_iterator &it)
utfchar32_t next(octet_iterator &it)
output_iterator replace_invalid(octet_iterator start, octet_iterator end, output_iterator out, utfchar32_t replacement)
octet_iterator utf16to8(u16bit_iterator start, u16bit_iterator end, octet_iterator result)
u16bit_iterator utf8to16(octet_iterator start, octet_iterator end, u16bit_iterator result)
octet_iterator utf32to8(u32bit_iterator start, u32bit_iterator end, octet_iterator result)
utfchar32_t peek_next(octet_iterator it)
unsigned short utfchar16_t