SNAP Library 6.0, Developer Reference  2020-12-09 16:24:20
SNAP, a general purpose, high performance system for analysis and manipulation of large networks
TUniChInfo Class Reference

#include <unicode.h>

Public Types

enum  {
  ccStarter = 0, ccOverlaysAndInterior = 1, ccNuktas = 7, ccHiraganaKatakanaVoicingMarks = 8,
  ccViramas = 9, ccFixedPositionStart = 10, ccFixedPositionEnd = 199, ccBelowLeftAttached = 200,
  ccBelowAttached = 202, ccBelowRightAttached = 204, ccLeftAttached = 208, ccRightAttached = 210,
  ccAboveLeftAttached = 212, ccAboveAttached = 214, ccAboveRightAttached = 216, ccBelowLeft = 218,
  ccBelow = 220, ccBelowRight = 222, ccLeft = 224, ccRight = 226,
  ccAboveLeft = 228, ccAbove = 230, ccAboveRight = 232, ccDoubleBelow = 233,
  ccDoubleAbove = 234, ccBelowIotaSubscript = 240, ccInvalid = 255
}
 

Public Member Functions

void InitAfterLoad ()
 
void SetCatAndSubCat (const TUniChSubCategory catAndSubCat)
 
void Save (TSOut &SOut) const
 
void Load (TSIn &SIn)
 
 TUniChInfo (TSIn &SIn)
 
 TUniChInfo ()
 
bool IsDcpFlag (const TUniChFlags flag) const
 
void ClrDcpFlags ()
 
void SetDcpFlag (const TUniChFlags flag)
 
bool IsAlphabetic () const
 
bool IsUppercase () const
 
bool IsLowercase () const
 
bool IsMath () const
 
bool IsDefaultIgnorable () const
 
bool IsGraphemeBase () const
 
bool IsGraphemeExtend () const
 
bool IsIdStart () const
 
bool IsIdContinue () const
 
bool IsXidStart () const
 
bool IsXidContinue () const
 
bool IsProperty (const TUniChProperties flag) const
 
void SetProperty (const TUniChProperties flag)
 
bool IsAsciiHexDigit () const
 
bool IsBidiControl () const
 
bool IsDash () const
 
bool IsDeprecated () const
 
bool IsDiacritic () const
 
bool IsExtender () const
 
bool IsGraphemeLink () const
 
bool IsHexDigit () const
 
bool IsHyphen () const
 
bool IsIdeographic () const
 
bool IsJoinControl () const
 
bool IsLogicalOrderException () const
 
bool IsNoncharacter () const
 
bool IsQuotationMark () const
 
bool IsSoftDotted () const
 
bool IsSTerminal () const
 
bool IsTerminalPunctuation () const
 
bool IsVariationSelector () const
 
bool IsWhiteSpace () const
 
bool IsPropertyX (const TUniChPropertiesX flag) const
 
void SetPropertyX (const TUniChPropertiesX flag)
 
bool IsCompositionExclusion () const
 
bool IsCompatibilityDecomposition () const
 
bool IsWbFlag (const TUniChFlags flag) const
 
void ClrWbAndSbFlags ()
 
void SetWbFlag (const TUniChFlags flag)
 
int GetWbFlags () const
 
bool IsWbFormat () const
 
TStr GetWbFlagsStr () const
 
bool IsSbFlag (const TUniChFlags flag) const
 
void SetSbFlag (const TUniChFlags flag)
 
int GetSbFlags () const
 
bool IsSbFormat () const
 
TStr GetSbFlagsStr () const
 
bool IsSbSep () const
 
bool IsGbExtend () const
 
bool IsCased () const
 
TUniChCategory GetCat () const
 
TUniChSubCategory GetSubCat () const
 
bool IsCurrency () const
 
bool IsPrivateUse () const
 
bool IsSurrogate () const
 

Static Public Member Functions

static ushort GetLineBreakCode (char c1, char c2)
 
static void LoadUShort (TSIn &SIn, ushort &u)
 
static void LoadSChar (TSIn &SIn, signed char &u)
 
static void SaveUShort (TSOut &SOut, ushort u)
 
static void SaveSChar (TSOut &SOut, signed char u)
 
static TStr GetWbFlagsStr (const int flags)
 
static TStr GetSbFlagsStr (const int flags)
 
static bool IsValidSubCat (const char chCat, const char chSubCat)
 

Public Attributes

char chCat
 
char chSubCat
 
uchar combClass
 
TUniChCategory cat
 
TUniChSubCategory subCat
 
signed char script
 
int simpleUpperCaseMapping
 
int simpleLowerCaseMapping
 
int simpleTitleCaseMapping
 
int decompOffset
 
int nameOffset
 
int flags
 
int properties
 
int propertiesX
 
ushort lineBreak
 

Static Public Attributes

static const ushort LineBreak_Unknown = TUniChInfo::GetLineBreakCode('X', 'X')
 
static const ushort LineBreak_ComplexContext = TUniChInfo::GetLineBreakCode('S', 'A')
 
static const ushort LineBreak_Numeric = TUniChInfo::GetLineBreakCode('N', 'U')
 
static const ushort LineBreak_InfixNumeric = TUniChInfo::GetLineBreakCode('I', 'S')
 
static const ushort LineBreak_Quotation = TUniChInfo::GetLineBreakCode('Q', 'U')
 

Friends

class TUniChDb
 

Detailed Description

Definition at line 985 of file unicode.h.

Member Enumeration Documentation

anonymous enum
Enumerator
ccStarter 
ccOverlaysAndInterior 
ccNuktas 
ccHiraganaKatakanaVoicingMarks 
ccViramas 
ccFixedPositionStart 
ccFixedPositionEnd 
ccBelowLeftAttached 
ccBelowAttached 
ccBelowRightAttached 
ccLeftAttached 
ccRightAttached 
ccAboveLeftAttached 
ccAboveAttached 
ccAboveRightAttached 
ccBelowLeft 
ccBelow 
ccBelowRight 
ccLeft 
ccRight 
ccAboveLeft 
ccAbove 
ccAboveRight 
ccDoubleBelow 
ccDoubleAbove 
ccBelowIotaSubscript 
ccInvalid 

Definition at line 988 of file unicode.h.

988  { // combining classes (for 'combClass'); from UnicodeData.txt
989  ccStarter = 0, // 0: Spacing, split, enclosing, reordrant, and Tibetan subjoined
990  ccOverlaysAndInterior = 1,
991  ccNuktas = 7,
992  ccHiraganaKatakanaVoicingMarks = 8,
993  ccViramas = 9,
994  ccFixedPositionStart = 10, // Start of fixed position classes
995  ccFixedPositionEnd = 199, // End of fixed position classes
996  ccBelowLeftAttached = 200,
997  ccBelowAttached = 202,
998  ccBelowRightAttached = 204,
999  ccLeftAttached = 208, // Left attached (reordrant around single base character)
1000  ccRightAttached = 210,
1001  ccAboveLeftAttached = 212,
1002  ccAboveAttached = 214,
1003  ccAboveRightAttached = 216,
1004  ccBelowLeft = 218,
1005  ccBelow = 220,
1006  ccBelowRight = 222,
1007  ccLeft = 224, // Left (reordrant around single base character)
1008  ccRight = 226,
1009  ccAboveLeft = 228,
1010  ccAbove = 230,
1011  ccAboveRight = 232,
1012  ccDoubleBelow = 233,
1013  ccDoubleAbove = 234,
1014  ccBelowIotaSubscript = 240, // Below (iota subscript)
1015  ccInvalid = 255 // not defined by Unicode
1016  };

Constructor & Destructor Documentation

TUniChInfo::TUniChInfo ( TSIn & SIn)
inline explicit

Definition at line 1061 of file unicode.h.

References Load().

1061 { Load(SIn); }
void Load(TSIn &SIn)
Definition: unicode.h:1056

Here is the call graph for this function:

TUniChInfo::TUniChInfo ( )
inline

Definition at line 1062 of file unicode.h.

References InitAfterLoad().

1062  : chCat(char(ucOther)), chSubCat(char(ucOtherNotAssigned & 0xff)), combClass(ccInvalid),
1065  InitAfterLoad(); }
uchar combClass
Definition: unicode.h:1018
void InitAfterLoad()
Definition: unicode.h:1035
char chCat
Definition: unicode.h:1017
int simpleUpperCaseMapping
Definition: unicode.h:1022
int propertiesX
Definition: unicode.h:1027
int simpleTitleCaseMapping
Definition: unicode.h:1022
ushort lineBreak
Definition: unicode.h:1028
int properties
Definition: unicode.h:1026
char chSubCat
Definition: unicode.h:1017
int simpleLowerCaseMapping
Definition: unicode.h:1022
static const ushort LineBreak_Unknown
Definition: unicode.h:1032
int decompOffset
Definition: unicode.h:1023
signed char script
Definition: unicode.h:1021
int nameOffset
Definition: unicode.h:1024
int flags
Definition: unicode.h:1025

Here is the call graph for this function:

Member Function Documentation

void TUniChInfo::ClrDcpFlags ( )
inline

Definition at line 1069 of file unicode.h.

References ucfDcpMask.

1069 { flags = flags & ~ucfDcpMask; }
int flags
Definition: unicode.h:1025
void TUniChInfo::ClrWbAndSbFlags ( )
inline

Definition at line 1116 of file unicode.h.

References ucfSbMask, and ucfWbMask.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1116 { flags = flags & ~(ucfWbMask | ucfSbMask); }
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

TUniChCategory TUniChInfo::GetCat ( ) const
inline

Definition at line 1145 of file unicode.h.

References cat.

1145 { return (TUniChCategory) cat; }
enum TUniChCategory_ TUniChCategory
TUniChCategory cat
Definition: unicode.h:1019
static ushort TUniChInfo::GetLineBreakCode ( char  c1,
char  c2 
)
inline static

Definition at line 1031 of file unicode.h.

Referenced by TUniChDb::InitLineBreaks().

1031 { return ((static_cast<ushort>(static_cast<uchar>(c1)) & 0xff) << 8) | ((static_cast<ushort>(static_cast<uchar>(c2)) & 0xff)); }
unsigned char uchar
Definition: bd.h:10
unsigned short ushort
Definition: bd.h:13

Here is the caller graph for this function:

int TUniChInfo::GetSbFlags ( ) const
inline

Definition at line 1128 of file unicode.h.

References ucfSbMask.

Referenced by GetSbFlagsStr(), and TUniChDb::InitWordAndSentenceBoundaryFlags().

1128 { return flags & ucfSbMask; }
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

TStr TUniChInfo::GetSbFlagsStr ( ) const
inline

Definition at line 1130 of file unicode.h.

References GetSbFlags(), and GetSbFlagsStr().

Referenced by GetSbFlagsStr(), TUniChDb::InitWordAndSentenceBoundaryFlags(), and TUniChDb::TestFindNextWordOrSentenceBoundary().

1130 { return GetSbFlagsStr(GetSbFlags()); }
TStr GetSbFlagsStr() const
Definition: unicode.h:1130
int GetSbFlags() const
Definition: unicode.h:1128

Here is the call graph for this function:

Here is the caller graph for this function:

static TStr TUniChInfo::GetSbFlagsStr ( const int  flags)
inline static

Definition at line 1131 of file unicode.h.

References ucfSbATerm, ucfSbClose, ucfSbFormat, ucfSbLower, ucfSbNumeric, ucfSbOLetter, ucfSbSep, ucfSbSp, ucfSbSTerm, and ucfSbUpper.

1131  { return TStr("") + (flags & ucfSbSep ? "S" : "") +
1132  (flags & ucfSbFormat ? "F" : "") + (flags & ucfSbSp ? "_" : "") + (flags & ucfSbLower ? "L" : "") +
1133  (flags & ucfSbUpper ? "U" : "") + (flags & ucfSbOLetter ? "O" : "") + (flags & ucfSbNumeric ? "N" : "") +
1134  (flags & ucfSbATerm ? "A" : "") + (flags & ucfSbSTerm ? "T" : "") + (flags & ucfSbClose ? "C" : ""); }
Definition: dt.h:412
int flags
Definition: unicode.h:1025
TUniChSubCategory TUniChInfo::GetSubCat ( ) const
inline

Definition at line 1146 of file unicode.h.

References subCat.

1146 { return (TUniChSubCategory) subCat; }
enum TUniChSubCategory_ TUniChSubCategory
TUniChSubCategory subCat
Definition: unicode.h:1020
int TUniChInfo::GetWbFlags ( ) const
inline

Definition at line 1118 of file unicode.h.

References ucfWbMask.

Referenced by GetWbFlagsStr(), and TUniChDb::InitWordAndSentenceBoundaryFlags().

1118 { return flags & ucfWbMask; }
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

TStr TUniChInfo::GetWbFlagsStr ( ) const
inline

Definition at line 1120 of file unicode.h.

References GetWbFlags(), and GetWbFlagsStr().

Referenced by GetWbFlagsStr(), and TUniChDb::TestFindNextWordOrSentenceBoundary().

1120 { return GetWbFlagsStr(GetWbFlags()); }
int GetWbFlags() const
Definition: unicode.h:1118
TStr GetWbFlagsStr() const
Definition: unicode.h:1120

Here is the call graph for this function:

Here is the caller graph for this function:

static TStr TUniChInfo::GetWbFlagsStr ( const int  flags)
inline static

Definition at line 1121 of file unicode.h.

References ucfWbALetter, ucfWbExtendNumLet, ucfWbFormat, ucfWbKatakana, ucfWbMidLetter, ucfWbMidNum, and ucfWbNumeric.

1121  { return TStr("") + (flags & ucfWbALetter ? "A" : "") +
1122  (flags & ucfWbFormat ? "F" : "") + (flags & ucfWbKatakana ? "K" : "") + (flags & ucfWbMidLetter ? "M" : "") +
1123  (flags & ucfWbMidNum ? "m" : "") + (flags & ucfWbNumeric ? "N" : "") + (flags & ucfWbExtendNumLet ? "E" : ""); }
Definition: dt.h:412
int flags
Definition: unicode.h:1025
void TUniChInfo::InitAfterLoad ( )
inline

Definition at line 1035 of file unicode.h.

Referenced by Load(), TUniChDb::LoadTxt(), and TUniChInfo().

1035  {
1036  cat = (TUniChCategory) chCat;
1037  subCat = (TUniChSubCategory) (((static_cast<int>(static_cast<uchar>(chCat)) & 0xff) << 8) | (static_cast<int>(static_cast<uchar>(chSubCat)) & 0xff)); }
enum TUniChSubCategory_ TUniChSubCategory
TUniChSubCategory subCat
Definition: unicode.h:1020
enum TUniChCategory_ TUniChCategory
TUniChCategory cat
Definition: unicode.h:1019
char chCat
Definition: unicode.h:1017
char chSubCat
Definition: unicode.h:1017

Here is the caller graph for this function:

bool TUniChInfo::IsAlphabetic ( ) const
inline

Definition at line 1071 of file unicode.h.

References IsDcpFlag(), and ucfDcpAlphabetic.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), and TUStr::IsAlphabetic().

1071 { return IsDcpFlag(ucfDcpAlphabetic); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsAsciiHexDigit ( ) const
inline

Definition at line 1086 of file unicode.h.

References IsProperty(), and ucfPrAsciiHexDigit.

1086 { return IsProperty(ucfPrAsciiHexDigit); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsBidiControl ( ) const
inline

Definition at line 1087 of file unicode.h.

References IsProperty(), and ucfPrBidiControl.

1087 { return IsProperty(ucfPrBidiControl); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsCased ( ) const
inline

Definition at line 1142 of file unicode.h.

References IsLowercase(), and IsUppercase().

Referenced by TUStr::IsCase().

1142 { return IsUppercase() || IsLowercase() || (subCat == ucLetterTitlecase); }
TUniChSubCategory subCat
Definition: unicode.h:1020
bool IsUppercase() const
Definition: unicode.h:1072
bool IsLowercase() const
Definition: unicode.h:1073

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsCompatibilityDecomposition ( ) const
inline

Definition at line 1112 of file unicode.h.

References ucfCompatibilityDecomposition.

Referenced by TUniChDb::AddDecomposition(), and TUniChDb::LoadTxt().

Here is the caller graph for this function:

bool TUniChInfo::IsCompositionExclusion ( ) const
inline

Definition at line 1111 of file unicode.h.

References ucfCompositionExclusion.

Referenced by TUniChDb::LoadTxt().

Here is the caller graph for this function:

bool TUniChInfo::IsCurrency ( ) const
inline

Definition at line 1157 of file unicode.h.

1157 { return subCat == ucSymbolCurrency; }
TUniChSubCategory subCat
Definition: unicode.h:1020
bool TUniChInfo::IsDash ( ) const
inline

Definition at line 1088 of file unicode.h.

References IsProperty(), and ucfPrDash.

1088 { return IsProperty(ucfPrDash); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsDcpFlag ( const TUniChFlags  flag) const
inline

Definition at line 1068 of file unicode.h.

References Assert, and ucfDcpMask.

Referenced by TUniChDb::InitDerivedCoreProperties(), IsAlphabetic(), IsDefaultIgnorable(), IsGraphemeBase(), IsGraphemeExtend(), IsIdContinue(), IsIdStart(), IsLowercase(), IsMath(), IsUppercase(), IsXidContinue(), and IsXidStart().

1068 { Assert((flag & ucfDcpMask) == flag); return (flags & flag) == flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

bool TUniChInfo::IsDefaultIgnorable ( ) const
inline

Definition at line 1075 of file unicode.h.

References IsDcpFlag(), and ucfDcpDefaultIgnorableCodePoint.

bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

bool TUniChInfo::IsDeprecated ( ) const
inline

Definition at line 1089 of file unicode.h.

References IsProperty(), and ucfPrDeprecated.

1089 { return IsProperty(ucfPrDeprecated); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsDiacritic ( ) const
inline

Definition at line 1090 of file unicode.h.

References IsProperty(), and ucfPrDiacritic.

1090 { return IsProperty(ucfPrDiacritic); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsExtender ( ) const
inline

Definition at line 1091 of file unicode.h.

References IsProperty(), and ucfPrExtender.

1091 { return IsProperty(ucfPrExtender); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsGbExtend ( ) const
inline

Definition at line 1139 of file unicode.h.

References IsGraphemeExtend().

Referenced by TUniChDb::IsWbIgnored().

1139 { return IsGraphemeExtend(); }
bool IsGraphemeExtend() const
Definition: unicode.h:1077

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsGraphemeBase ( ) const
inline

Definition at line 1076 of file unicode.h.

References IsDcpFlag(), and ucfDcpGraphemeBase.

1076 { return IsDcpFlag(ucfDcpGraphemeBase); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

bool TUniChInfo::IsGraphemeExtend ( ) const
inline

Definition at line 1077 of file unicode.h.

References IsDcpFlag(), and ucfDcpGraphemeExtend.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), and IsGbExtend().

1077 { return IsDcpFlag(ucfDcpGraphemeExtend); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsGraphemeLink ( ) const
inline

Definition at line 1092 of file unicode.h.

References IsProperty(), and ucfPrGraphemeLink.

1092 { return IsProperty(ucfPrGraphemeLink); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsHexDigit ( ) const
inline

Definition at line 1093 of file unicode.h.

References IsProperty(), and ucfPrHexDigit.

1093 { return IsProperty(ucfPrHexDigit); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsHyphen ( ) const
inline

Definition at line 1094 of file unicode.h.

References IsProperty(), and ucfPrHyphen.

1094 { return IsProperty(ucfPrHyphen); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsIdContinue ( ) const
inline

Definition at line 1079 of file unicode.h.

References IsDcpFlag(), and ucfDcpIdContinue.

1079 { return IsDcpFlag(ucfDcpIdContinue); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

bool TUniChInfo::IsIdeographic ( ) const
inline

Definition at line 1095 of file unicode.h.

References IsProperty(), and ucfPrIdeographic.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1095 { return IsProperty(ucfPrIdeographic); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsIdStart ( ) const
inline

Definition at line 1078 of file unicode.h.

References IsDcpFlag(), and ucfDcpIdStart.

1078 { return IsDcpFlag(ucfDcpIdStart); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

bool TUniChInfo::IsJoinControl ( ) const
inline

Definition at line 1096 of file unicode.h.

References IsProperty(), and ucfPrJoinControl.

1096 { return IsProperty(ucfPrJoinControl); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsLogicalOrderException ( ) const
inline

Definition at line 1097 of file unicode.h.

References IsProperty(), and ucfPrLogicalOrderException.

bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsLowercase ( ) const
inline

Definition at line 1073 of file unicode.h.

References IsDcpFlag(), and ucfDcpLowercase.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), IsCased(), and TUStr::IsLowerCase().

1073 { return IsDcpFlag(ucfDcpLowercase); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsMath ( ) const
inline

Definition at line 1074 of file unicode.h.

References IsDcpFlag(), and ucfDcpMath.

Referenced by TUStr::IsMath().

1074 { return IsDcpFlag(ucfDcpMath); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsNoncharacter ( ) const
inline

Definition at line 1098 of file unicode.h.

References IsProperty(), and ucfPrNoncharacterCodePoint.

bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsPrivateUse ( ) const
inline

Definition at line 1161 of file unicode.h.

1161 { return subCat == ucOtherPrivateUse; }
TUniChSubCategory subCat
Definition: unicode.h:1020
bool TUniChInfo::IsPropertyX ( const TUniChPropertiesX  flag) const
inline

Definition at line 1107 of file unicode.h.

Referenced by TUniChDb::InitPropList().

1107 { return (propertiesX & flag) == flag; }
int propertiesX
Definition: unicode.h:1027

Here is the caller graph for this function:

bool TUniChInfo::IsQuotationMark ( ) const
inline

Definition at line 1099 of file unicode.h.

References IsProperty(), and ucfPrQuotationMark.

1099 { return IsProperty(ucfPrQuotationMark); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsSbFlag ( const TUniChFlags  flag) const
inline

Definition at line 1126 of file unicode.h.

References Assert, and ucfSbMask.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), and IsSbFormat().

1126 { Assert((flag & ucfSbMask) == flag); return (flags & flag) == flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

bool TUniChInfo::IsSbFormat ( ) const
inline

Definition at line 1129 of file unicode.h.

References IsSbFlag(), and ucfSbFormat.

1129 { return IsSbFlag(ucfSbFormat); }
bool IsSbFlag(const TUniChFlags flag) const
Definition: unicode.h:1126

Here is the call graph for this function:

bool TUniChInfo::IsSbSep ( ) const
inline

Definition at line 1136 of file unicode.h.

References ucfSbSep.

1136 { return (flags & ucfSbSep) == ucfSbSep; }
int flags
Definition: unicode.h:1025
bool TUniChInfo::IsSoftDotted ( ) const
inline

Definition at line 1100 of file unicode.h.

References IsProperty(), and ucfPrSoftDotted.

1100 { return IsProperty(ucfPrSoftDotted); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsSTerminal ( ) const
inline

Definition at line 1101 of file unicode.h.

References IsProperty(), and ucfPrSTerm.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1101 { return IsProperty(ucfPrSTerm); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsSurrogate ( ) const
inline

Definition at line 1162 of file unicode.h.

1162 { return subCat == ucOtherSurrogate; }
TUniChSubCategory subCat
Definition: unicode.h:1020
bool TUniChInfo::IsTerminalPunctuation ( ) const
inline

Definition at line 1102 of file unicode.h.

References IsProperty(), and ucfPrTerminalPunctuation.

bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsUppercase ( ) const
inline

Definition at line 1072 of file unicode.h.

References IsDcpFlag(), and ucfDcpUppercase.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), IsCased(), and TUStr::IsUpperCase().

1072 { return IsDcpFlag(ucfDcpUppercase); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

Here is the caller graph for this function:

static bool TUniChInfo::IsValidSubCat ( const char  chCat,
const char  chSubCat 
)
inline static

Definition at line 1164 of file unicode.h.

Referenced by TUniChDb::TSubcatHelper::ProcessComment().

1164  {
1165  static const char s[] = "LuLlLtLmLoMnMcMeNdNlNoPcPdPsPePiPfPoSmScSkSoZsZlZpCcCfCsCoCn";
1166  for (const char *p = s; *p; p += 2)
1167  if (chCat == p[0] && chSubCat == p[1]) return true;
1168  return false; }
char chCat
Definition: unicode.h:1017
char chSubCat
Definition: unicode.h:1017

Here is the caller graph for this function:

bool TUniChInfo::IsVariationSelector ( ) const
inline

Definition at line 1103 of file unicode.h.

References IsProperty(), and ucfPrVariationSelector.

bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

bool TUniChInfo::IsWbFlag ( const TUniChFlags  flag) const
inline

Definition at line 1115 of file unicode.h.

References Assert, and ucfWbMask.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags(), and IsWbFormat().

1115 { Assert((flag & ucfWbMask) == flag); return (flags & flag) == flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

bool TUniChInfo::IsWbFormat ( ) const
inline

Definition at line 1119 of file unicode.h.

References IsWbFlag(), and ucfWbFormat.

Referenced by TUniChDb::IsWbIgnored().

1119 { return IsWbFlag(ucfWbFormat); }
bool IsWbFlag(const TUniChFlags flag) const
Definition: unicode.h:1115

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsWhiteSpace ( ) const
inline

Definition at line 1104 of file unicode.h.

References IsProperty(), and ucfPrWhiteSpace.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1104 { return IsProperty(ucfPrWhiteSpace); }
bool IsProperty(const TUniChProperties flag) const
Definition: unicode.h:1084

Here is the call graph for this function:

Here is the caller graph for this function:

bool TUniChInfo::IsXidContinue ( ) const
inline

Definition at line 1081 of file unicode.h.

References IsDcpFlag(), and ucfDcpXidContinue.

1081 { return IsDcpFlag(ucfDcpXidContinue); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

bool TUniChInfo::IsXidStart ( ) const
inline

Definition at line 1080 of file unicode.h.

References IsDcpFlag(), and ucfDcpXidStart.

1080 { return IsDcpFlag(ucfDcpXidStart); }
bool IsDcpFlag(const TUniChFlags flag) const
Definition: unicode.h:1068

Here is the call graph for this function:

void TUniChInfo::Load ( TSIn & SIn)
inline

Definition at line 1056 of file unicode.h.

References InitAfterLoad(), TSIn::Load(), LoadSChar(), and LoadUShort().

Referenced by TUniChInfo().

1056  {
1057  SIn.Load(chCat); SIn.Load(chSubCat); SIn.Load(combClass); LoadSChar(SIn, script);
1059  SIn.Load(decompOffset); SIn.Load(nameOffset);
uchar combClass
Definition: unicode.h:1018
void InitAfterLoad()
Definition: unicode.h:1035
char chCat
Definition: unicode.h:1017
int simpleUpperCaseMapping
Definition: unicode.h:1022
static void LoadUShort(TSIn &SIn, ushort &u)
Definition: unicode.h:1045
int propertiesX
Definition: unicode.h:1027
int simpleTitleCaseMapping
Definition: unicode.h:1022
ushort lineBreak
Definition: unicode.h:1028
void Load(bool &Bool)
Definition: fl.h:84
static void LoadSChar(TSIn &SIn, signed char &u)
Definition: unicode.h:1046
int properties
Definition: unicode.h:1026
char chSubCat
Definition: unicode.h:1017
int simpleLowerCaseMapping
Definition: unicode.h:1022
int decompOffset
Definition: unicode.h:1023
signed char script
Definition: unicode.h:1021
int nameOffset
Definition: unicode.h:1024
int flags
Definition: unicode.h:1025

Here is the call graph for this function:

Here is the caller graph for this function:

static void TUniChInfo::LoadSChar ( TSIn &  SIn,
signed char &  u 
)
inline static

Definition at line 1046 of file unicode.h.

References TSIn::LoadBf().

Referenced by Load().

1046 { SIn.LoadBf(&u, sizeof(u)); }
void LoadBf(const void *Bf, const TSize &BfL)
Definition: fl.h:81

Here is the call graph for this function:

Here is the caller graph for this function:

static void TUniChInfo::LoadUShort ( TSIn &  SIn,
ushort &  u 
)
inline static

Definition at line 1045 of file unicode.h.

References TSIn::LoadBf().

Referenced by Load().

1045 { SIn.LoadBf(&u, sizeof(u)); }
void LoadBf(const void *Bf, const TSize &BfL)
Definition: fl.h:81

Here is the call graph for this function:

Here is the caller graph for this function:

void TUniChInfo::Save ( TSOut & SOut) const
inline

Definition at line 1051 of file unicode.h.

References TSOut::Save(), SaveSChar(), and SaveUShort().

1051  {
1052  SOut.Save(chCat); SOut.Save(chSubCat); SOut.Save(combClass); SaveSChar(SOut, script);
1054  SOut.Save(decompOffset); SOut.Save(nameOffset);
1055  SOut.Save(flags); SOut.Save(properties); SOut.Save(propertiesX); SaveUShort(SOut, lineBreak); }
uchar combClass
Definition: unicode.h:1018
char chCat
Definition: unicode.h:1017
static void SaveUShort(TSOut &SOut, ushort u)
Definition: unicode.h:1047
int simpleUpperCaseMapping
Definition: unicode.h:1022
int propertiesX
Definition: unicode.h:1027
int simpleTitleCaseMapping
Definition: unicode.h:1022
ushort lineBreak
Definition: unicode.h:1028
int properties
Definition: unicode.h:1026
void Save(const bool &Bool)
Definition: fl.h:173
char chSubCat
Definition: unicode.h:1017
int simpleLowerCaseMapping
Definition: unicode.h:1022
int decompOffset
Definition: unicode.h:1023
signed char script
Definition: unicode.h:1021
int nameOffset
Definition: unicode.h:1024
static void SaveSChar(TSOut &SOut, signed char u)
Definition: unicode.h:1048
int flags
Definition: unicode.h:1025

Here is the call graph for this function:

static void TUniChInfo::SaveSChar ( TSOut &  SOut,
signed char  u 
)
inline static

Definition at line 1048 of file unicode.h.

References TSOut::SaveBf().

Referenced by Save().

1048 { SOut.SaveBf(&u, sizeof(u)); }
void SaveBf(const void *Bf, const TSize &BfL)
Definition: fl.h:172

Here is the call graph for this function:

Here is the caller graph for this function:

static void TUniChInfo::SaveUShort ( TSOut &  SOut,
ushort  u 
)
inline static

Definition at line 1047 of file unicode.h.

References TSOut::SaveBf().

Referenced by Save().

1047 { SOut.SaveBf(&u, sizeof(u)); }
void SaveBf(const void *Bf, const TSize &BfL)
Definition: fl.h:172

Here is the call graph for this function:

Here is the caller graph for this function:

void TUniChInfo::SetCatAndSubCat ( const TUniChSubCategory  catAndSubCat)
inline

Definition at line 1038 of file unicode.h.

1038  {
1039  cat = (TUniChCategory) ((int(catAndSubCat) >> 8) & 0xff);
1040  subCat = catAndSubCat;
1041  chCat = (char) cat; chSubCat = (char) (int(subCat) & 0xff); }
TUniChSubCategory subCat
Definition: unicode.h:1020
enum TUniChCategory_ TUniChCategory
TUniChCategory cat
Definition: unicode.h:1019
char chCat
Definition: unicode.h:1017
char chSubCat
Definition: unicode.h:1017
void TUniChInfo::SetDcpFlag ( const TUniChFlags  flag)
inline

Definition at line 1070 of file unicode.h.

References Assert, and ucfDcpMask.

Referenced by TUniChDb::InitDerivedCoreProperties().

1070 { Assert((flag & ucfDcpMask) == flag); flags |= flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

void TUniChInfo::SetProperty ( const TUniChProperties  flag)
inline

Definition at line 1085 of file unicode.h.

Referenced by TUniChDb::InitPropList().

1085 { properties |= flag; }
int properties
Definition: unicode.h:1026

Here is the caller graph for this function:

void TUniChInfo::SetPropertyX ( const TUniChPropertiesX  flag)
inline

Definition at line 1108 of file unicode.h.

Referenced by TUniChDb::InitPropList().

1108 { propertiesX |= flag; }
int propertiesX
Definition: unicode.h:1027

Here is the caller graph for this function:

void TUniChInfo::SetSbFlag ( const TUniChFlags  flag)
inline

Definition at line 1127 of file unicode.h.

References Assert, and ucfSbMask.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1127 { Assert((flag & ucfSbMask) == flag); flags |= flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

void TUniChInfo::SetWbFlag ( const TUniChFlags  flag)
inline

Definition at line 1117 of file unicode.h.

References Assert, and ucfWbMask.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

1117 { Assert((flag & ucfWbMask) == flag); flags |= flag; }
#define Assert(Cond)
Definition: bd.h:251
int flags
Definition: unicode.h:1025

Here is the caller graph for this function:

Friends And Related Function Documentation

friend class TUniChDb
friend

Definition at line 1042 of file unicode.h.

Member Data Documentation

TUniChCategory TUniChInfo::cat

Definition at line 1019 of file unicode.h.

Referenced by GetCat().

char TUniChInfo::chCat

Definition at line 1017 of file unicode.h.

Referenced by TUniChDb::LoadTxt().

char TUniChInfo::chSubCat

Definition at line 1017 of file unicode.h.

Referenced by TUniChDb::LoadTxt().

uchar TUniChInfo::combClass

Definition at line 1018 of file unicode.h.

Referenced by TUniChDb::LoadTxt().

int TUniChInfo::decompOffset
int TUniChInfo::flags
ushort TUniChInfo::lineBreak

Definition at line 1028 of file unicode.h.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

const ushort TUniChInfo::LineBreak_ComplexContext = TUniChInfo::GetLineBreakCode('S', 'A')
static

Definition at line 1032 of file unicode.h.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

const ushort TUniChInfo::LineBreak_InfixNumeric = TUniChInfo::GetLineBreakCode('I', 'S')
static

Definition at line 1032 of file unicode.h.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

const ushort TUniChInfo::LineBreak_Numeric = TUniChInfo::GetLineBreakCode('N', 'U')
static

Definition at line 1032 of file unicode.h.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

const ushort TUniChInfo::LineBreak_Quotation = TUniChInfo::GetLineBreakCode('Q', 'U')
static

Definition at line 1032 of file unicode.h.

Referenced by TUniChDb::InitWordAndSentenceBoundaryFlags().

const ushort TUniChInfo::LineBreak_Unknown = TUniChInfo::GetLineBreakCode('X', 'X')
static

Definition at line 1032 of file unicode.h.

Referenced by TUniChDb::InitLineBreaks().

int TUniChInfo::nameOffset

Definition at line 1024 of file unicode.h.

Referenced by TUniChDb::LoadTxt().

int TUniChInfo::properties

Definition at line 1026 of file unicode.h.

Referenced by TUniChDb::TestWbFindNonIgnored().

int TUniChInfo::propertiesX

Definition at line 1027 of file unicode.h.

Referenced by TUniChDb::TestWbFindNonIgnored().

int TUniChInfo::simpleLowerCaseMapping
int TUniChInfo::simpleTitleCaseMapping
int TUniChInfo::simpleUpperCaseMapping
TUniChSubCategory TUniChInfo::subCat

Definition at line 1020 of file unicode.h.

Referenced by GetSubCat(), and TUniChDb::InitWordAndSentenceBoundaryFlags().


The documentation for this class was generated from the following files: