Specialization of the Utf template for UTF-8. More...
#include <Utf.hpp>
Static Public Member Functions | |
template<typename In > | |
static In | decode (In begin, In end, Uint32 &output, Uint32 replacement=0) |
Decode a single UTF-8 character. | |
template<typename Out > | |
static Out | encode (Uint32 input, Out output, Uint8 replacement=0) |
Encode a single UTF-8 character. | |
template<typename In > | |
static In | next (In begin, In end) |
Advance to the next UTF-8 character. | |
template<typename In > | |
static std::size_t | count (In begin, In end) |
Count the number of characters of a UTF-8 sequence. | |
template<typename In , typename Out > | |
static Out | fromAnsi (In begin, In end, Out output, const std::locale &locale=std::locale()) |
Convert an ANSI characters range to UTF-8. | |
template<typename In , typename Out > | |
static Out | fromWide (In begin, In end, Out output) |
Convert a wide characters range to UTF-8. | |
template<typename In , typename Out > | |
static Out | fromLatin1 (In begin, In end, Out output) |
Convert a latin-1 (ISO-5589-1) characters range to UTF-8. | |
template<typename In , typename Out > | |
static Out | toAnsi (In begin, In end, Out output, char replacement=0, const std::locale &locale=std::locale()) |
Convert an UTF-8 characters range to ANSI characters. | |
template<typename In , typename Out > | |
static Out | toWide (In begin, In end, Out output, wchar_t replacement=0) |
Convert an UTF-8 characters range to wide characters. | |
template<typename In , typename Out > | |
static Out | toLatin1 (In begin, In end, Out output, char replacement=0) |
Convert an UTF-8 characters range to latin-1 (ISO-5589-1) characters. | |
template<typename In , typename Out > | |
static Out | toUtf8 (In begin, In end, Out output) |
Convert a UTF-8 characters range to UTF-8. | |
template<typename In , typename Out > | |
static Out | toUtf16 (In begin, In end, Out output) |
Convert a UTF-8 characters range to UTF-16. | |
template<typename In , typename Out > | |
static Out | toUtf32 (In begin, In end, Out output) |
Convert a UTF-8 characters range to UTF-32. | |
Specialization of the Utf template for UTF-8.
|
static |
Count the number of characters of a UTF-8 sequence.
This function is necessary for multi-elements encodings, as a single character may use more than 1 storage element, thus the total size can be different from (begin - end).
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
|
static |
Decode a single UTF-8 character.
Decoding a character means finding its unique 32-bits code (called the codepoint) in the Unicode standard.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Codepoint of the decoded UTF-8 character |
replacement | Replacement character to use in case the UTF-8 sequence is invalid |
|
static |
Encode a single UTF-8 character.
Encoding a character means converting a unique 32-bits code (called the codepoint) in the target encoding, UTF-8.
input | Codepoint to encode as UTF-8 |
output | Iterator pointing to the beginning of the output sequence |
replacement | Replacement for characters not convertible to UTF-8 (use 0 to skip them) |
|
static |
Convert an ANSI characters range to UTF-8.
The current global locale will be used by default, unless you pass a custom one in the locale parameter.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
locale | Locale to use for conversion |
|
static |
Convert a latin-1 (ISO-5589-1) characters range to UTF-8.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
|
static |
Convert a wide characters range to UTF-8.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
|
static |
Advance to the next UTF-8 character.
This function is necessary for multi-elements encodings, as a single character may use more than 1 storage element.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
|
static |
Convert an UTF-8 characters range to ANSI characters.
The current global locale will be used by default, unless you pass a custom one in the locale parameter.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
replacement | Replacement for characters not convertible to ANSI (use 0 to skip them) |
locale | Locale to use for conversion |
|
static |
Convert an UTF-8 characters range to latin-1 (ISO-5589-1) characters.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
replacement | Replacement for characters not convertible to wide (use 0 to skip them) |
|
static |
Convert a UTF-8 characters range to UTF-16.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
|
static |
Convert a UTF-8 characters range to UTF-32.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
|
static |
Convert a UTF-8 characters range to UTF-8.
This functions does nothing more than a direct copy; it is defined only to provide the same interface as other specializations of the sf::Utf<> template, and allow generic code to be written on top of it.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
|
static |
Convert an UTF-8 characters range to wide characters.
begin | Iterator pointing to the beginning of the input sequence |
end | Iterator pointing to the end of the input sequence |
output | Iterator pointing to the beginning of the output sequence |
replacement | Replacement for characters not convertible to wide (use 0 to skip them) |