SNAP Library 6.0, User Reference
2020-12-09 16:24:20
SNAP, a general-purpose, high-performance system for analysis and manipulation of large networks
|
#include <unicode.h>
Public Types | |
typedef TUniChDb::TCaseConversion | TCaseConversion |
Public Member Functions | |
TUnicode () | |
TUnicode (const TStr &fnBinUcd) | |
void | Init () |
int | DecodeUtf8 (const TIntV &src, TIntV &dest) const |
int | DecodeUtf8 (const TStr &src, TIntV &dest) const |
int | EncodeUtf8 (const TIntV &src, TIntV &dest) const |
TStr | EncodeUtf8Str (const TIntV &src) const |
int | DecodeUtf16FromBytes (const TIntV &src, TIntV &dest, const TUtf16BomHandling bomHandling=bomAllowed, const TUniByteOrder defaultByteOrder=boMachineEndian) const |
int | DecodeUtf16FromWords (const TIntV &src, TIntV &dest, const TUtf16BomHandling bomHandling=bomAllowed, const TUniByteOrder defaultByteOrder=boMachineEndian) const |
int | EncodeUtf16ToWords (const TIntV &src, TIntV &dest, const bool insertBom, const TUniByteOrder destByteOrder=boMachineEndian) const |
int | EncodeUtf16ToBytes (const TIntV &src, TIntV &dest, const bool insertBom, const TUniByteOrder destByteOrder=boMachineEndian) const |
void | RegisterCodec (const TStr &nameList, const PCodecBase &codec) |
void | UnregisterCodec (const TStr &nameList) |
void | ClrCodecs () |
void | InitCodecs () |
PCodecBase | GetCodec (const TStr &name) const |
void | GetAllCodecs (TCodecBaseV &dest) const |
bool | FindNextWordBoundary (const TIntV &src, int &position) const |
void | FindWordBoundaries (const TIntV &src, TBoolV &dest) const |
bool | FindNextSentenceBoundary (const TIntV &src, int &position) const |
void | FindSentenceBoundaries (const TIntV &src, TBoolV &dest) const |
void | ClrSentenceBoundaryExceptions () |
void | UseEnglishSentenceBoundaryExceptions () |
void | Decompose (const TIntV &src, TIntV &dest, bool compatibility) const |
void | Compose (const TIntV &src, TIntV &dest) const |
void | DecomposeAndCompose (const TIntV &src, TIntV &dest, bool compatibility) const |
int | ExtractStarters (const TIntV &src, TIntV &dest) const |
int | ExtractStarters (TIntV &src) const |
void | GetLowerCase (const TIntV &src, TIntV &dest) const |
void | GetUpperCase (const TIntV &src, TIntV &dest) const |
void | GetTitleCase (const TIntV &src, TIntV &dest) const |
void | GetSimpleLowerCase (const TIntV &src, TIntV &dest) const |
void | GetSimpleUpperCase (const TIntV &src, TIntV &dest) const |
void | GetSimpleTitleCase (const TIntV &src, TIntV &dest) const |
void | ToSimpleUpperCase (TIntV &src) const |
void | ToSimpleLowerCase (TIntV &src) const |
void | ToSimpleTitleCase (TIntV &src) const |
void | GetCaseFolded (const TIntV &src, TIntV &dest, const bool full=true) const |
void | ToCaseFolded (TIntV &src) const |
TStr | GetUtf8CaseFolded (const TStr &s) const |
DECLARE_FORWARDED_PROPERTY_METHODS ___UniFwd2 (IsPrivateUse, IsSurrogate) |
TUniChCategory | GetCat (const int cp) const |
TUniChSubCategory | GetSubCat (const int cp) const |
const char * | GetCharName (const int cp) const |
TStr | GetCharNameS (const int cp) const |
Static Public Member Functions | |
static void | EncodeUtf8 (const uint &Ch, TChA &Dest) |
static TStr | EncodeUtf8 (const uint &Ch) |
Static Protected Member Functions | |
static TStr | NormalizeCodecName (const TStr &name) |
Protected Attributes | |
THash< TStr, PCodecBase > | codecs |
|
inline explicit |
|
inline |
Definition at line 1941 of file unicode.h.
|
inline |
Definition at line 1810 of file unicode.h.
|
inline |
Definition at line 1823 of file unicode.h.
Definition at line 1787 of file unicode.h.
Definition at line 1788 of file unicode.h.
Definition at line 1934 of file unicode.h.
|
inline |
Definition at line 1946 of file unicode.h.
|
inline |
Definition at line 1838 of file unicode.h.
|
inline |
Definition at line 1834 of file unicode.h.
Definition at line 1792 of file unicode.h.
Definition at line 1696 of file unicode.cpp.
Definition at line 1728 of file unicode.cpp.
Definition at line 1796 of file unicode.h.
Definition at line 1951 of file unicode.h.
|
inline |
Definition at line 1953 of file unicode.h.
|
inline |
Definition at line 1916 of file unicode.h.
|
inline |
Definition at line 1901 of file unicode.h.
Definition at line 1922 of file unicode.h.
Definition at line 1907 of file unicode.h.
|
inline |
|
inline |
Definition at line 1989 of file unicode.h.
|
inline |
|
inline |
Definition at line 1883 of file unicode.h.
Definition at line 1965 of file unicode.h.
Definition at line 1972 of file unicode.h.
Definition at line 1974 of file unicode.h.
Definition at line 1973 of file unicode.h.
|
inline |
Definition at line 1967 of file unicode.h.
Definition at line 1966 of file unicode.h.
Definition at line 1994 of file unicode.h.
void TUnicode::InitCodecs | ( | ) |
Definition at line 1683 of file unicode.cpp.
Definition at line 1870 of file unicode.h.
|
inline |
Definition at line 1873 of file unicode.h.
|
inline |
Definition at line 1992 of file unicode.h.
|
inline |
Definition at line 1978 of file unicode.h.
|
inline |
Definition at line 1979 of file unicode.h.
|
inline |
Definition at line 1977 of file unicode.h.
|
inline |
Definition at line 1877 of file unicode.h.
|
inline |
|
protected |
T8BitCodec<TEncoding_CP1250> TUnicode::cp1250 |
T8BitCodec<TEncoding_CP437> TUnicode::cp437 |
T8BitCodec<TEncoding_CP852> TUnicode::cp852 |
T8BitCodec<TEncoding_ISO8859_1> TUnicode::iso8859_1 |
T8BitCodec<TEncoding_ISO8859_2> TUnicode::iso8859_2 |
T8BitCodec<TEncoding_ISO8859_3> TUnicode::iso8859_3 |
T8BitCodec<TEncoding_ISO8859_4> TUnicode::iso8859_4 |
T8BitCodec<TEncoding_YuAscii> TUnicode::yuAscii |