SNAP Library 6.0, Developer Reference
2020-12-09 16:24:20
SNAP, a general purpose, high performance system for analysis and manipulation of large networks
|
#include <html.h>
Public Types | |
typedef TStrKdV | TArgNmValV |
Public Member Functions | |
THtmlLx (const PSIn &_SIn, const bool &_DoParseArg=true) | |
THtmlLx & | operator= (const THtmlLx &) |
void | PutCh (const char &_Ch) |
void | PutStr (const TStr &Str) |
THtmlLxSym | GetSym () |
PHtmlTok | GetTok (const bool &DoUc=true) |
TStr | GetPreSpaceStr () const |
int | GetArgs () const |
TStr | GetArgNm (const int &ArgN) const |
TStr | GetArgVal (const int &ArgN) const |
bool | IsArg (const TStr &ArgNm) const |
TStr | GetArg (const TStr &ArgNm, const TStr &DfArgVal=TStr()) const |
void | PutArg (const TStr &ArgNm, const TStr &ArgVal) |
TStr | GetFullBTagStr () const |
void | MoveToStrOrEof (const TStr &Str) |
void | MoveToBTagOrEof (const TStr &TagNm) |
void | MoveToBTag2OrEof (const TStr &TagNm1, const TStr &TagNm2) |
void | MoveToBTag3OrEof (const TStr &TagNm1, const TStr &TagNm2, const TStr &TagNm3) |
void | MoveToBTagOrETagOrEof (const TStr &BTagNm, const TStr &ETagNm) |
void | MoveToBTagArgOrEof (const TStr &TagNm, const TStr &ArgNm, const TStr &ArgVal) |
void | MoveToBTagArg2OrEof (const TStr &TagNm, const TStr &ArgNm1, const TStr &ArgVal1, const TStr &ArgNm2, const TStr &ArgVal2, const bool &AndOpP=true) |
void | MoveToBTagOrEof (const TStr &TagNm1, const TStr &ArgNm1, const TStr &ArgVal1, const TStr &TagNm2, const TStr &ArgNm2, const TStr &ArgVal2) |
void | MoveToETagOrEof (const TStr &TagNm) |
TStr | GetTextOnlyStrToEof () |
TStr | GetStrToBTag (const TStr &TagNm, const bool &TxtOnlyP=false) |
TStr | GetStrToBTag (const TStr &TagNm, const TStr &ArgNm, const TStr &ArgVal, const bool &TxtOnlyP=false) |
TStr | GetStrToETag (const TStr &TagNm, const bool &TxtOnlyP=false) |
TStr | GetStrToETag2 (const TStr &TagNm1, const TStr &TagNm2, const bool &TxtOnlyP=false) |
TStr | GetStrInTag (const TStr &TagNm, const bool &TxtOnlyP=false) |
TStr | GetHRefBeforeStr (const TStr &Str) |
bool | IsGetBTag (const TStr &TagNm) |
bool | IsGetETag (const TStr &TagNm) |
Static Public Member Functions | |
static TStr | GetSymStr (const THtmlLxSym &Sym) |
static TStr | GetEscapedStr (const TChA &ChA) |
static TStr | GetAsciiStr (const TChA &ChA, const char &GenericCh='_') |
static void | GetTokStrV (const TStr &Str, TStrV &TokStrV) |
static TStr | GetNoTag (const TStr &Str) |
Public Attributes | |
THtmlLxSym | Sym |
int | SymBChX |
int | SymEChX |
TChA | ChA |
TChA | UcChA |
TChA | SymChA |
int | PreSpaces |
TChA | PreSpaceChA |
TArgNmValV | ArgNmValV |
Private Member Functions | |
void | GetCh () |
void | GetEscCh () |
void | GetMetaTag () |
void | GetTag () |
Private Attributes | |
PSIn | SIn |
TSIn & | RSIn |
bool | DoParseArg |
TChA | ChStack |
char | Ch |
int | ChX |
bool | EscCh |
TChA | EscChA |
TChA | ArgNm |
TChA | ArgVal |
Static Private Attributes | |
static THtmlLxChDef | ChDef |
typedef TStrKdV THtmlLx::TArgNmValV |
|
TStr THtmlLx::GetArg (const TStr &ArgNm, const TStr &DfArgVal=TStr()) const | inline |
Definition at line 139 of file html.h.
References TVec< TVal, TSizeTy >::SearchForw().
Referenced by THtmlDoc::_IsTagRedir(), GetHRefBeforeStr(), GetStrToBTag(), MoveToBTagArg2OrEof(), MoveToBTagArgOrEof(), and MoveToBTagOrEof().
|
TStr THtmlLx::GetArgNm (const int &ArgN) const | inline |
Definition at line 136 of file html.h.
Referenced by GetFullBTagStr(), and THtmlDoc::SaveHtmlToXml().
|
int THtmlLx::GetArgs () const | inline |
Definition at line 135 of file html.h.
References TVec< TVal, TSizeTy >::Len().
Referenced by GetFullBTagStr(), and THtmlDoc::SaveHtmlToXml().
|
TStr THtmlLx::GetArgVal (const int &ArgN) const | inline |
Definition at line 137 of file html.h.
Referenced by GetFullBTagStr(), and THtmlDoc::SaveHtmlToXml().
static TStr THtmlLx::GetAsciiStr (const TChA &ChA, const char &GenericCh='_')
Definition at line 584 of file html.cpp.
References Ch, and TChA::Len().
|
void THtmlLx::GetCh () | inline, private |
Definition at line 95 of file html.h.
References Ch, TChA::Empty(), TSIn::Eof(), TCh::EofCh, TSIn::GetCh(), TChA::Pop(), and SymChA.
Referenced by GetEscCh(), GetMetaTag(), GetSym(), and GetTag().
static TStr THtmlLx::GetEscapedStr (const TChA &ChA)
Definition at line 568 of file html.cpp.
References Ch, and TChA::Len().
|
void THtmlLx::GetEscCh () | private |
Definition at line 195 of file html.cpp.
References TChA::AddCh(), Ch, ChDef, TChA::Clr(), EscCh, EscChA, GetCh(), THtmlLxChDef::GetEscStr(), PutCh(), and PutStr().
Referenced by GetMetaTag(), GetSym(), and GetTag().
TStr THtmlLx::GetFullBTagStr | ( | ) | const |
Definition at line 358 of file html.cpp.
References ChA, GetArgNm(), GetArgs(), GetArgVal(), hsyBTag, IAssert, TChA::Pop(), and Sym.
Referenced by THtmlDoc::GetRedirHtmlDocStr().
|
void THtmlLx::GetMetaTag () | private |
Definition at line 225 of file html.cpp.
References Ch, TCh::EofCh, GetCh(), GetEscCh(), hsyMTag, and Sym.
Referenced by GetSym().
|
TStr THtmlLx::GetPreSpaceStr () const | inline |
Definition at line 132 of file html.h.
References TStr::GetSpaceStr().
TStr THtmlLx::GetStrInTag (const TStr &TagNm, const bool &TxtOnlyP=false)
Definition at line 525 of file html.cpp.
References GetStrToETag(), and MoveToBTagOrEof().
TStr THtmlLx::GetStrToBTag (const TStr &TagNm, const TStr &ArgNm, const TStr &ArgVal, const bool &TxtOnlyP=false)
TStr THtmlLx::GetStrToETag2 (const TStr &TagNm1, const TStr &TagNm2, const bool &TxtOnlyP=false)
THtmlLxSym THtmlLx::GetSym | ( | ) |
Definition at line 277 of file html.cpp.
References TChA::AddCh(), ArgNmValV, Ch, ChA, ChDef, ChX, TChA::Clr(), TVec< TVal, TSizeTy >::Clr(), TChA::Empty(), EscCh, forever, GetCh(), THtmlLxChDef::GetChTy(), GetEscCh(), GetMetaTag(), GetTag(), THtmlLxChDef::GetUc(), hlctAlpha, hlctEof, hlctLTag, hlctNum, hlctRTag, hlctSym, hsyEof, hsyNum, hsySSym, hsyStr, hsyUndef, THtmlLxChDef::IsAlNum(), THtmlLxChDef::IsAlpha(), THtmlLxChDef::IsNum(), THtmlLxChDef::IsSpace(), TChA::LastCh(), TChA::Pop(), PreSpaceChA, PreSpaces, PutCh(), Sym, SymBChX, SymChA, SymEChX, and UcChA.
Referenced by GetHRefBeforeStr(), GetNoTag(), THtmlDoc::GetRedirHtmlDocStr(), GetStrToBTag(), GetStrToETag(), GetStrToETag2(), GetTextOnlyStrToEof(), GetTokStrV(), THtmlDoc::GetTxtLnDoc(), IsGetBTag(), IsGetETag(), MoveToBTag2OrEof(), MoveToBTag3OrEof(), MoveToBTagArg2OrEof(), MoveToBTagArgOrEof(), MoveToBTagOrEof(), MoveToBTagOrETagOrEof(), MoveToETagOrEof(), MoveToStrOrEof(), THtmlDoc::SaveHtmlToXml(), and THtmlDoc::THtmlDoc().
|
TStr THtmlLx::GetSymStr (const THtmlLxSym &Sym) | static |
|
void THtmlLx::GetTag () | private |
Definition at line 236 of file html.cpp.
References TVec< TVal, TSizeTy >::Add(), TChA::AddCh(), ArgNm, ArgNmValV, ArgVal, Ch, ChA, ChDef, TChA::Clr(), DoParseArg, TCh::EofCh, GetCh(), GetEscCh(), THtmlLxChDef::GetUc(), hsyBTag, hsyETag, THtmlLxChDef::IsAlNum(), THtmlLxChDef::IsAlpha(), THtmlLxChDef::IsEoln(), THtmlLxChDef::IsWs(), Sym, and UcChA.
Referenced by GetSym().
TStr THtmlLx::GetTextOnlyStrToEof | ( | ) |
PHtmlTok THtmlLx::GetTok | ( | const bool & | DoUc = true | ) |
Definition at line 353 of file html.cpp.
References ArgNmValV, ChA, Sym, and UcChA.
Referenced by THtmlDoc::GetTxtLnDoc(), THtmlDoc::SaveHtmlToXml(), and THtmlDoc::THtmlDoc().
static void THtmlLx::GetTokStrV (const TStr &Str, TStrV &TokStrV)
Definition at line 595 of file html.cpp.
References TVec< TVal, TSizeTy >::Add(), ChA, TVec< TVal, TSizeTy >::Clr(), GetSym(), hsyEof, TStrIn::New(), SIn, and Sym.
|
bool THtmlLx::IsArg (const TStr &ArgNm) const | inline |
Definition at line 138 of file html.h.
References TVec< TVal, TSizeTy >::IsIn().
Referenced by THtmlDoc::_IsTagRedir(), GetStrToBTag(), MoveToBTagArg2OrEof(), MoveToBTagArgOrEof(), and MoveToBTagOrEof().
bool THtmlLx::IsGetBTag | ( | const TStr & | TagNm | ) |
bool THtmlLx::IsGetETag | ( | const TStr & | TagNm | ) |
void THtmlLx::MoveToBTagArg2OrEof (const TStr &TagNm, const TStr &ArgNm1, const TStr &ArgVal1, const TStr &ArgNm2, const TStr &ArgVal2, const bool &AndOpP=true)
void THtmlLx::MoveToBTagOrEof | ( | const TStr & | TagNm | ) |
void THtmlLx::MoveToBTagOrEof (const TStr &TagNm1, const TStr &ArgNm1, const TStr &ArgVal1, const TStr &TagNm2, const TStr &ArgNm2, const TStr &ArgVal2)
void THtmlLx::MoveToETagOrEof | ( | const TStr & | TagNm | ) |
void THtmlLx::MoveToStrOrEof | ( | const TStr & | Str | ) |
void THtmlLx::PutArg (const TStr &ArgNm, const TStr &ArgVal)
Definition at line 142 of file html.h.
References TVec< TVal, TSizeTy >::Add(), and TVec< TVal, TSizeTy >::SearchForw().
Referenced by THtmlDoc::_IsTagRedir().
|
void THtmlLx::PutCh (const char &_Ch) | inline |
Definition at line 126 of file html.h.
References TChA::Empty(), TChA::Pop(), and TChA::Push().
Referenced by GetEscCh(), GetSym(), and PutStr().
|
void THtmlLx::PutStr (const TStr &Str) | inline |
Definition at line 128 of file html.h.
References TStr::Len(), and PutCh().
Referenced by GetEscCh().
TArgNmValV THtmlLx::ArgNmValV |
|
char THtmlLx::Ch | private |
Definition at line 89 of file html.h.
Referenced by GetAsciiStr(), GetCh(), GetEscapedStr(), GetEscCh(), GetMetaTag(), GetSym(), and GetTag().
TChA THtmlLx::ChA |
Definition at line 109 of file html.h.
Referenced by THtmlDoc::_IsTagRedir(), GetFullBTagStr(), GetHRefBeforeStr(), GetNoTag(), GetStrToBTag(), GetStrToETag(), GetStrToETag2(), GetSym(), GetTag(), GetTextOnlyStrToEof(), GetTok(), GetTokStrV(), THtmlDoc::GetTxtLnDoc(), IsGetBTag(), IsGetETag(), MoveToStrOrEof(), and THtmlDoc::SaveHtmlToXml().
|
THtmlLxChDef THtmlLx::ChDef | static, private |
Definition at line 84 of file html.h.
Referenced by GetEscCh(), GetSym(), and GetTag().
|
bool THtmlLx::EscCh | private |
Definition at line 91 of file html.h.
Referenced by GetEscCh(), and GetSym().
|
TChA THtmlLx::EscChA | private |
Definition at line 92 of file html.h.
Referenced by GetEscCh().
TChA THtmlLx::PreSpaceChA |
Definition at line 113 of file html.h.
Referenced by THtmlDoc::GetRedirHtmlDocStr(), and GetSym().
int THtmlLx::PreSpaces |
Definition at line 112 of file html.h.
Referenced by GetNoTag(), GetStrToBTag(), GetStrToETag(), GetStrToETag2(), GetSym(), GetTextOnlyStrToEof(), and THtmlDoc::GetTxtLnDoc().
|
PSIn THtmlLx::SIn | private |
Definition at line 85 of file html.h.
Referenced by GetNoTag(), and GetTokStrV().
THtmlLxSym THtmlLx::Sym |
Definition at line 107 of file html.h.
Referenced by THtmlDoc::_IsTagRedir(), GetFullBTagStr(), GetHRefBeforeStr(), GetMetaTag(), GetNoTag(), THtmlDoc::GetRedirHtmlDocStr(), GetStrToBTag(), GetStrToETag(), GetStrToETag2(), GetSym(), GetTag(), GetTextOnlyStrToEof(), GetTok(), GetTokStrV(), THtmlDoc::GetTxtLnDoc(), MoveToBTag2OrEof(), MoveToBTag3OrEof(), MoveToBTagArg2OrEof(), MoveToBTagArgOrEof(), MoveToBTagOrEof(), MoveToBTagOrETagOrEof(), MoveToETagOrEof(), MoveToStrOrEof(), THtmlDoc::SaveHtmlToXml(), and THtmlDoc::THtmlDoc().
TChA THtmlLx::SymChA |
Definition at line 111 of file html.h.
Referenced by GetCh(), THtmlDoc::GetRedirHtmlDocStr(), and GetSym().
TChA THtmlLx::UcChA |
Definition at line 110 of file html.h.
Referenced by GetHRefBeforeStr(), GetStrToBTag(), GetStrToETag(), GetStrToETag2(), GetSym(), GetTag(), GetTok(), MoveToBTag2OrEof(), MoveToBTag3OrEof(), MoveToBTagArg2OrEof(), MoveToBTagArgOrEof(), MoveToBTagOrEof(), MoveToBTagOrETagOrEof(), MoveToETagOrEof(), and THtmlDoc::THtmlDoc().