textwolf
0.2
|
character set encoding UTF-8 More...
#include <charset_utf8.hpp>
Classes | |
class | CharLengthTab |
Table that maps the first UTF-8 character byte to the length of the character in bytes. More... | |
Public Types | |
enum | { MaxChar =0x7FFFFFFFU } |
Maximum character that can be represented by this encoding implementation. More... | |
enum | { B11111111 =0xFF, B01111111 =0x7F, B00111111 =0x3F, B00011111 =0x1F, B00001111 =0x0F, B00000111 =0x07, B00000011 =0x03, B00000001 =0x01, B00000000 =0x00, B10000000 =0x80, B11000000 =0xC0, B11100000 =0xE0, B11110000 =0xF0, B11111000 =0xF8, B11111100 =0xFC, B11111110 =0xFE, B11011111 =B11000000|B00011111, B11101111 =B11100000|B00001111, B11110111 =B11110000|B00000111, B11111011 =B11111000|B00000011, B11111101 =B11111100|B00000001 } |
Public Member Functions | |
template<class Iterator > | |
UChar | value (char *buf, unsigned int &bufpos, Iterator &itr) const |
See template<class Iterator>Interface::value(char*,unsigned int&,Iterator&) More... | |
template<class Buffer_ > | |
void | print (UChar chr, Buffer_ &buf) const |
See template<class Buffer>Interface::print(UChar,Buffer&) More... | |
Static Public Member Functions | |
template<class Iterator > | |
static unsigned int | size (char *buf, unsigned int &bufpos, Iterator &itr) |
Get the size of the current character in bytes (variable length encoding) More... | |
template<class Iterator > | |
static void | skip (char *buf, unsigned int &bufpos, Iterator &itr) |
See template<class Iterator>Interface::skip(char*,unsigned int&,Iterator&) More... | |
template<class Iterator > | |
static signed char | asciichar (char *buf, unsigned int &bufpos, Iterator &itr) |
See template<class Iterator>Interface::asciichar(char*,unsigned int&,Iterator&) More... | |
template<class Iterator > | |
static void | fetchbytes (char *buf, unsigned int &bufpos, Iterator &itr) |
See template<class Iterator>Interface::fetch(char*,unsigned int&,Iterator&) More... | |
static bool | is_equal (const UTF8 &, const UTF8 &) |
See Interface::is_equal( const Interface&, const Interface&) More... | |
character set encoding UTF-8
anonymous enum |
anonymous enum |
|
inline static |
See template<class Iterator>Interface::asciichar(char*,unsigned int&,Iterator&)
|
inline static |
See template<class Iterator>Interface::fetch(char*,unsigned int&,Iterator&)
See Interface::is_equal( const Interface&, const Interface&)
|
inline |
See template<class Buffer>Interface::print(UChar,Buffer&)
|
inline static |
Get the size of the current character in bytes (variable length encoding)
[in] | buf | buffer for the character data |
[in,out] | bufpos | position in 'buf' |
[in,out] | itr | iterator to skip |
|
inline static |
See template<class Iterator>Interface::skip(char*,unsigned int&,Iterator&)
|
inline |
See template<class Iterator>Interface::value(char*,unsigned int&,Iterator&)