|
|
|
|
|
|
Modules Namespace List Class Hierarchy Alphabetical List Compound List Namespace Members Compound Members Related Pages
acdk::lang::StringUtf8Utils Struct Reference
#include <StringUtf8Utils.h>
List of all members.
Detailed Description
Internal Helper class to handle UTF8 strings.
|
Public Types |
enum | UtfStreamType { StreamIsAscii,
StreamIsUtf8,
StreamIsError
} |
Static Public Member Functions |
void | incUtfPtr (const char *&ptr, const char *endptr) |
void | decUtfPtr (const char *&ptr, const char *beginptr) |
size_t | utfDiff (const char *end, const char *begin) |
bool | isAscii (const char *begin, const char *end) |
ucchar | fetchWideChar (const char *&begin, const char *end) |
ucchar | toWideChar (const char *begin, const char *end) |
int | getByteLength (const char *it) |
int | utflength (ucchar ch) |
| returns the number of bytes a unicode character needs
|
int | utflength (const ucchar *begin, const ucchar *end) |
| returns the number of bytes a unicode string needs
|
int | utflength (const ucchar *begin) |
UtfStreamType | validUtf8Stream (const byte *begin, const byte *end, bool throwOnFail=true) |
| check if the character byte stream is a valid UTF8 stream.
|
int | uclength (const ucchar *ch) |
| returns the length of a 0-terminated unicode character string
|
int | uc2length (const uc2char *ch) |
int | uc4length (const uc4char *ch) |
| returns the length of a 0-terminated uc4char stream
|
int | writeUcToUtf8 (byte *&it, byte *end, ucchar ucc) |
| writes a unicode char into the given chars
|
int | writeUcToUtf8 (byte *&it, byte *end, const ucchar *ucbegin, const ucchar *ucend) |
| writes the given unicode character range into an 8-bit char range
|
ucchar * | uc4touc (ucchar *buffer, const uc4char *source, int length=-1) |
| converts a uc4 character stream to a ucchar stream.
|
ucchar * | wcchartouc (ucchar *buffer, const wchar_t *source, int length=-1) |
size_t | stringlength (const char *str) |
size_t | stringlength (const ucchar *str) |
size_t | stringlength (const uc4char *str) |
template<typename ToCharType, typename FromCharType> ToCharType * | convertTo (ToCharType *buffer, const FromCharType *source, int length=-1) |
Member Enumeration Documentation
|
- Enumeration values:
-
StreamIsAscii |
|
StreamIsUtf8 |
|
StreamIsError |
|
|
Member Function Documentation
template<typename ToCharType, typename FromCharType> |
ToCharType* acdk::lang::StringUtf8Utils::convertTo |
( |
ToCharType * |
buffer, |
|
|
const FromCharType * |
source, |
|
|
int |
length = -1 |
|
) |
[inline, static] |
|
void acdk::lang::StringUtf8Utils::decUtfPtr |
( |
const char *& |
ptr, |
|
|
const char * |
beginptr |
|
) |
[static] |
|
ucchar acdk::lang::StringUtf8Utils::fetchWideChar |
( |
const char *& |
begin, |
|
|
const char * |
end |
|
) |
[static] |
|
int acdk::lang::StringUtf8Utils::getByteLength |
( |
const char * |
it |
) |
[static] |
|
void acdk::lang::StringUtf8Utils::incUtfPtr |
( |
const char *& |
ptr, |
|
|
const char * |
endptr |
|
) |
[static] |
|
bool acdk::lang::StringUtf8Utils::isAscii |
( |
const char * |
begin, |
|
|
const char * |
end |
|
) |
[static] |
|
size_t acdk::lang::StringUtf8Utils::stringlength |
( |
const uc4char * |
str |
) |
[inline, static] |
|
size_t acdk::lang::StringUtf8Utils::stringlength |
( |
const ucchar * |
str |
) |
[inline, static] |
|
size_t acdk::lang::StringUtf8Utils::stringlength |
( |
const char * |
str |
) |
[inline, static] |
|
ucchar acdk::lang::StringUtf8Utils::toWideChar |
( |
const char * |
begin, |
|
|
const char * |
end |
|
) |
[inline, static] |
|
int acdk::lang::StringUtf8Utils::uc2length |
( |
const uc2char * |
ch |
) |
[inline, static] |
|
int acdk::lang::StringUtf8Utils::uc4length |
( |
const uc4char * |
ch |
) |
[static] |
|
|
returns the length of a 0-terminated uc4char stream
|
ucchar* acdk::lang::StringUtf8Utils::uc4touc |
( |
ucchar * |
buffer, |
|
|
const uc4char * |
source, |
|
|
int |
length = -1 |
|
) |
[static] |
|
|
converts a uc4 character stream to a ucchar stream.
uc4 chars that cannot be mapped are mapped to 0xFFFF.
buffer must have enough space to hold length + 1 chars.
- Parameters:
-
buffer | target to write |
source | 0 terminated uc4char stream |
length | length of source, -1 if 0 terminated uc4 string |
- Returns:
- just the buffer
|
int acdk::lang::StringUtf8Utils::uclength |
( |
const ucchar * |
ch |
) |
[static] |
|
|
returns the length of a 0-terminated unicode character string
|
size_t acdk::lang::StringUtf8Utils::utfDiff |
( |
const char * |
end, |
|
|
const char * |
begin |
|
) |
[static] |
|
int acdk::lang::StringUtf8Utils::utflength |
( |
const ucchar * |
begin |
) |
[inline, static] |
|
int acdk::lang::StringUtf8Utils::utflength |
( |
const ucchar * |
begin, |
|
|
const ucchar * |
end |
|
) |
[static] |
|
|
returns the number of bytes a unicode string needs
|
int acdk::lang::StringUtf8Utils::utflength |
( |
ucchar |
ch |
) |
[static] |
|
|
returns the number of bytes a unicode character needs
|
UtfStreamType acdk::lang::StringUtf8Utils::validUtf8Stream |
( |
const byte * |
begin, |
|
|
const byte * |
end, |
|
|
bool |
throwOnFail = true |
|
) |
[static] |
|
|
check if the character byte stream is a valid UTF8 stream.
If throwOnFail is true, a UTFDataFormatException will be thrown on failure. |
ucchar* acdk::lang::StringUtf8Utils::wcchartouc |
( |
ucchar * |
buffer, |
|
|
const wchar_t * |
source, |
|
|
int |
length = -1 |
|
) |
[static] |
|
int acdk::lang::StringUtf8Utils::writeUcToUtf8 |
( |
byte *& |
it, |
|
|
byte * |
end, |
|
|
const ucchar * |
ucbegin, |
|
|
const ucchar * |
ucend |
|
) |
[static] |
|
|
writes the given unicode character range into an 8-bit char range
- Parameters:
-
it | start position to write. Will be modified to point to the next writing position after this method call |
end | capacity position, if 0 no checking for end is done |
- Returns:
- 0 is OK; -1 is error; > 0 is the number of byte chars needed to encode to end
|
int acdk::lang::StringUtf8Utils::writeUcToUtf8 |
( |
byte *& |
it, |
|
|
byte * |
end, |
|
|
ucchar |
ucc |
|
) |
[static] |
|
|
writes a unicode char into the given chars
- Parameters:
-
it | start position to write. Will be modified to point to the next writing position after this method call |
end | capacity position, if 0 no checking for end is done |
- Returns:
- 0 is OK; -1 is error; > 0 is the number of chars needed to encode the given unicode character to end. In case of a return value != 0, the position of it will not be changed.
|
|
|