SNAP Library, User Reference
2012-10-02 12:56:23
SNAP, a general purpose network analysis and graph mining library
|
Static Public Member Functions | |
static TChA & | GetXmlTagVal (TXmlLx &XmlLx, const TChA &TagNm) |
static void | GetXmlTagNmVal (TXmlLx &XmlLx, TChA &TagNm, TChA &TagVal) |
static bool | GetXmlTagNmVal2 (TXmlLx &XmlLx, TChA &TagNm, TChA &TagVal, const bool &TakeTagNms) |
static TChA | GetDomNm (const TChA &UrlChA) |
static TChA | GetDomNm2 (const TChA &UrlChA) |
static TChA | GetWebsiteNm (const TChA &UrlChA) |
static bool | GetNormalizedUrl (const TChA &UrlIn, const TChA &BaseUrl, TChA &UrlOut) |
Quick URL normalization: Remove ending /, /index.html, etc. and strip starting www. | |
static bool | StripEnd (const TChA &Str, const TChA &SearchStr, TChA &NewStr) |
static TChA | GetShorStr (const TChA &LongStr, const int MaxLen=50) |
static TChA | GetCleanStr (const TChA &ChA) |
static TChA | GetCleanWrdStr (const TChA &ChA) |
static int | CountWords (const char *CStr) |
static int | CountWords (const TChA &ChA) |
static int | CountWords (const TChA &ChA, const TStrHash< TInt > &StopWordH) |
static int | SplitWords (TChA &ChA, TVec< char * > &WrdV, const bool &SplitOnWs=true) |
static int | SplitOnCh (TChA &ChA, TVec< char * > &WrdV, const char &Ch, const bool &SkipEmpty=false) |
static int | SplitLines (TChA &ChA, TVec< char * > &LineV, const bool &SkipEmpty=false) |
static int | SplitSentences (TChA &ChA, TVec< char * > &SentenceV) |
static void | RemoveHtmlTags (const TChA &HtmlStr, TChA &TextStr) |
static bool | IsLatinStr (const TChA &Str, const double &MinAlFrac) |
static void | GetWIdV (const TStrHash< TInt > &StrH, const char *CStr, TIntV &WIdV) |
static void | GetAddWIdV (TStrHash< TInt > &StrH, const char *CStr, TIntV &WIdV) |
static bool | GetTmFromStr (const char *TmStr, TSecTm &Tm) |
Parses time in many different text formats. See source code for details. | |
static TStr | GetStdName (TStr AuthorName) |
Puts a person's name (first middle last) in a standard form: <last_name>_<first name initial> | |
static void | GetStdNameV (TStr AuthorNames, TStrV &StdNameV) |
Splits a list of people's names. |
String helper functions and utilities. Quick and dirty!
int TStrUtil::CountWords | ( | const char * | CStr | ) | [static] |
int TStrUtil::CountWords | ( | const TChA & | ChA | ) | [static] |
int TStrUtil::CountWords | ( | const TChA & | ChA, |
const TStrHash< TInt > & | StopWordH | ||
) | [static] |
void TStrUtil::GetAddWIdV | ( | TStrHash< TInt > & | StrH, |
const char * | CStr, | ||
TIntV & | WIdV | ||
) | [static] |
TChA TStrUtil::GetCleanStr | ( | const TChA & | ChA | ) | [static] |
TChA TStrUtil::GetCleanWrdStr | ( | const TChA & | ChA | ) | [static] |
TChA TStrUtil::GetDomNm | ( | const TChA & | UrlChA | ) | [static] |
TChA TStrUtil::GetDomNm2 | ( | const TChA & | UrlChA | ) | [static] |
bool TStrUtil::GetNormalizedUrl | ( | const TChA & | UrlIn, |
const TChA & | BaseUrl, | ||
TChA & | UrlOut | ||
) | [static] |
Quick URL normalization: Remove ending /, /index.html, etc. and strip starting www.
TChA TStrUtil::GetShorStr | ( | const TChA & | LongStr, |
const int | MaxLen = 50 |
||
) | [static] |
TStr TStrUtil::GetStdName | ( | TStr | AuthorName | ) | [static] |
Puts a person's name (first middle last) in a standard form: <last_name>_<first name initial>
void TStrUtil::GetStdNameV | ( | TStr | AuthorNames, |
TStrV & | StdNameV | ||
) | [static] |
Splits a list of people's names.
bool TStrUtil::GetTmFromStr | ( | const char * | TmStr, |
TSecTm & | Tm | ||
) | [static] |
Parses time in many different text formats. See source code for details.
TChA TStrUtil::GetWebsiteNm | ( | const TChA & | UrlChA | ) | [static] |
void TStrUtil::GetWIdV | ( | const TStrHash< TInt > & | StrH, |
const char * | CStr, | ||
TIntV & | WIdV | ||
) | [static] |
void TStrUtil::GetXmlTagNmVal | ( | TXmlLx & | XmlLx, |
TChA & | TagNm, | ||
TChA & | TagVal | ||
) | [static] |
bool TStrUtil::GetXmlTagNmVal2 | ( | TXmlLx & | XmlLx, |
TChA & | TagNm, | ||
TChA & | TagVal, | ||
const bool & | TakeTagNms | ||
) | [static] |
TChA & TStrUtil::GetXmlTagVal | ( | TXmlLx & | XmlLx, |
const TChA & | TagNm | ||
) | [static] |
bool TStrUtil::IsLatinStr | ( | const TChA & | Str, |
const double & | MinAlFrac | ||
) | [static] |
void TStrUtil::RemoveHtmlTags | ( | const TChA & | HtmlStr, |
TChA & | TextStr | ||
) | [static] |
int TStrUtil::SplitLines | ( | TChA & | ChA, |
TVec< char * > & | LineV, | ||
const bool & | SkipEmpty = false |
||
) | [static] |
int TStrUtil::SplitOnCh | ( | TChA & | ChA, |
TVec< char * > & | WrdV, | ||
const char & | Ch, | ||
const bool & | SkipEmpty = false |
||
) | [static] |
int TStrUtil::SplitSentences | ( | TChA & | ChA, |
TVec< char * > & | SentenceV | ||
) | [static] |
int TStrUtil::SplitWords | ( | TChA & | ChA, |
TVec< char * > & | WrdV, | ||
const bool & | SplitOnWs = true |
||
) | [static] |
bool TStrUtil::StripEnd | ( | const TChA & | Str, |
const TChA & | SearchStr, | ||
TChA & | NewStr | ||
) | [static] |