|
| CLemmatizerEnglish () |
|
virtual | ~CLemmatizerEnglish () |
|
| CLemmatizer (MorphLanguageEnum Language) |
|
virtual | ~CLemmatizer () |
|
MorphLanguageEnum | GetLanguage () const |
|
const CStatistic & | GetStatistic () const |
|
bool | CheckABC (const string &WordForm) const |
|
bool | IsHyphenPostfix (const string &Postfix) const |
|
bool | IsHyphenPrefix (const string &Prefix) const |
|
bool | initIconv (const string &enc_internal="", const string &enc_external="UTF8") |
|
std::string | recode_ext2int (const std::string s_ext) const |
|
std::string | recode_int2ext (const std::string s_int) const |
|
bool | LoadDictionariesRegistry (string &strError) |
|
bool | CreateParadigmCollection (bool bNorm, string &WordStr, bool capital, bool bUsePrediction, vector< CFormInfo > &Result) const |
|
void | GetAllAncodesQuick (const BYTE *WordForm, bool capital, BYTE *OutBuffer, bool bUsePrediction) const |
|
bool | GetAllAncodesAndLemmasQuick (string &InputWordStr, bool capital, char *OutBuffer, size_t MaxBufferSize, bool bUsePrediction) const |
|
| CMorphDict (MorphLanguageEnum Language) |
|
virtual | ~CMorphDict () |
|
void | InitAutomat (CMorphAutomat *pFormAutomat) |
|
bool | Load (string GrammarFileName) |
|
bool | Save (string GrammarFileName) const |
|
void | PredictBySuffix (const string &Text, size_t &TextOffset, size_t MinimalPredictSuffixlen, vector< CAutomAnnotationInner > &Infos) const |
|
string | GetAllMorphInterpsStr (const string &Text, const size_t TextPos, bool bFullInterp) const |
|
|
bool | m_bLoaded |
|
bool | m_bMaximalPrediction |
|
bool | m_bUseStatistic |
|
bool | m_bAllowRussianJo |
|
std::string | m_enc_int |
| Internal encoding (default: "" = none).
|
|
std::string | m_enc_ext |
| External encoding (default: "" = none).
|
|
ddcIconv * | m_ic_ext2int |
| iconv converter from the user (external) encoding to the morph-internal encoding.
|
|
ddcIconv * | m_ic_int2ext |
| iconv converter from the morph-internal encoding to the user (external) encoding.
|
|
vector< CFlexiaModel > | m_FlexiaModels |
|
vector< CAccentModel > | m_AccentModels |
|
CShortStringHolder | m_Bases |
|
vector< CLemmaInfoAndLemma > | m_LemmaInfos |
|
StringVector | m_Prefixes |
|
vector< BYTE > | m_NPSs |
|
string | GetRegistryString () const |
|
string | GetPath () const |
|
void | ReadOptions (string FileName) |
|
bool | LemmatizeWord (string &InputWordStr, const bool cap, const bool predict, vector< CAutomAnnotationInner > &results, bool bGetLemmaInfos) const |
|
void | AssignWeightIfNeed (vector< CAutomAnnotationInner > &FindResults) const |
|
bool | CheckAbbreviation (string InputWordStr, vector< CAutomAnnotationInner > &FindResults, bool is_cap) const |
|
CAutomAnnotationInner | ConvertPredictTupleToAnnot (const CPredictTuple &input) const |
|
void | PredictByDataBase (string InputWordStr, vector< CAutomAnnotationInner > &results, bool is_cap) const |
|
bool | IsPrefix (const string &Prefix) const |
|
void | GetLemmaInfos (const string &Text, size_t TextPos, vector< CAutomAnnotationInner > &Infos) const |
|
void | CreateModelsIndex () |
|
string | m_Registry |
|
set< string > | m_HyphenPostfixes |
|
set< string > | m_HyphenPrefixes |
|
CStatistic | m_Statistic |
|
CPredictBase | m_Predict |
|
set< string > | m_PrefixesSet |
|
CMorphAutomat * | m_pFormAutomat |
|
vector< int > | m_ModelsIndex |
|
IsLessMorphInterp | m_SearchInfoLess |
|