ddc
|
#include "ddcConfig.h"
#include <stdint.h>
#include <stdio.h>
#include <assert.h>
#include <stdarg.h>
#include <string.h>
#include <ctype.h>
#include <string>
#include <algorithm>
#include <stdexcept>
#include <vector>
#include <typeinfo>
#include "set"
#include "stack"
#include "map"
#include "time.h"
#include <malloc.h>
#include <unistd.h>
#include "../CommonLib/ddcLocale.h"
#include "../CommonLib/ddcVersion.h"
#include "../CommonLib/ddcString.h"
Go to the source code of this file.
Classes | |
struct | troika< T1, T2, T3 > |
class | CExpc |
generic local exception class moo: derived from stdexcept runtime_error More... | |
class | CFatalExpc |
local exception class, fatal (can be used to force immediate bail-out) More... | |
struct | DDCProcessMemoryStatus |
Macros | |
#define | WIN32_LEAN_AND_MEAN |
#define | likely(x) x |
#define | unlikely(x) x |
#define | _QM(X) (((QWORD)1)<<X) |
Typedefs | |
typedef unsigned char | BYTE |
typedef uint32_t | DWORD |
typedef uint16_t | WORD |
typedef uint64_t | QWORD |
typedef unsigned int | UINT |
typedef vector< string > | StringVector |
typedef set< string > | StringSet |
typedef vector< DWORD > | DwordVector |
typedef QWORD | file_off_t |
Enumerations | |
enum | MorphLanguageEnum { morphUnknown = 0, morphRussian = 1, morphEnglish = 2, morphGerman = 3, morphGeneric = 4, morphURL =5, morphDigits =6 } |
enum | RegisterEnum { AnyRegister =0, LowLow =1, UpLow =2, UpUp =3 } |
Functions | |
QWORD | GetMaxQWORD () |
bool | FileExists (const char *FName) |
bool | FileExists (const string &FName) |
bool | IsDirectory (const char *DirName) |
bool | IsDirectory (const string &DirName) |
file_off_t | FileSize (const char *filename) |
file_off_t | FileSize (const string &filename) |
time_t | FileMTime (const char *filename) |
bool | FSeek (FILE *fp, file_off_t pos, int origin) |
file_off_t | FTell (FILE *fp) |
void | ErrorMessage (const string &Label, const string &Message) |
void | ErrorMessage (const string &Message) |
string | MakeFName (const string &InpitFileName, const string &Ext) |
bool | MakePath (const char *RossPath, const char *FileName, char *FullPath) |
string | GetPathByFile (string FileName) |
bool | IsBinFile (const char *FileName) |
bool | IsEmptyLine (const char *t) |
bool | IsHtmlFile (const string &FileName) |
bool | IsTableFile (const string &FileName) |
bool | IsJsonFile (const string &FileName) |
string | FileExtension (const string &FileName) |
string | FileDirectory (const string &FileName) |
Returns directory part of FileName, or "." if FileName is a bare filename, like dirname(3) More... | |
string | FileBasename (const string &FileName) |
Returns file part of FileName, like basename(3) More... | |
string | FileBasename (const string &FileName, const string &FileExtension) |
Returns basename FileName, removing any trailing extension FileExtension. More... | |
string | CurrentDirectory (void) |
Wrapper for getcwd(); returns current working directory of current process. More... | |
bool | IsAbsolutePath (const string &PathName) |
Returns true iff PathName is an absolute path (simple string heuristics) More... | |
string | RelativePathName (const string &RefDir, const string &PathName) |
If PathName is absolute, it is returned; otherwise returns (RefDir + "/" + PathName) More... | |
string | RelativeFileName (const string &RefFile, const string &PathName) |
If PathName is absolute, it is returned; otherwise returns (FileDirectory(RefFile) + "/" + PathName) More... | |
void | AddFile (const char *MainFile, const char *ToAdd) |
AddFile(): old ugly file-append hack using system("cat...") More... | |
void | FileAppend (FILE *src, FILE *dst) |
FileAppend(): newer better replacement for AddFile() More... | |
void | FileAppend (const char *srcFile, const char *dstFile) |
void | FileAppend (const string &srcFile, const string &dstFile) |
void | FileAppendPartial (FILE *src, FILE *dst, size_t nBytes) |
FileAppendPartial(): append a substring of src to dst. More... | |
bool | RmlMoveFile (const char *oldpath, const char *newpath) |
bool | RmlCopyFile (const char *oldpath, const char *newpath) |
string | CreateTempFileName () |
bool | MakeDir (const string &DirName) |
bool | MakeDirP (const string &DirName) |
bool | RemoveWithPrint (const string &FileName) |
size_t | GetNumberOfOpenFiles (pid_t pid=0) |
string | GetRegistryString (string RegistryPath) |
bool | CanGetRegistryString (string RegistryPath) |
bool | IsRmlRegistered (string &Error) |
struct tm | RmlGetCurrentTime () |
string | GetIniFilePath () |
string | GetRmlVariable () |
char * | rtrim (char *s) |
bool | IsSuperEqualChar (BYTE ch1, BYTE ch2, MorphLanguageEnum langua) |
int | CompareWithoutRegister (const char *s1, const char *s2, size_t l, MorphLanguageEnum langua) |
BYTE | force_rus_char (BYTE ch) |
bool | force_to_rus (char *dest, const char *sour, size_t len) |
char * | IntToStr (int Value, char *Buffer) |
string & | IntToStr (int Value, string &oBuffer) |
string & | TrimLeft (string &str) |
string & | TrimRight (string &str) |
string & | Trim (string &str) |
bool | LoadFileToString (string FileName, string &Result, bool clobber=true) |
bool | SaveStringToFile (const string &Str, const string &FileName) |
void | KOI8ToWin (string &s) |
void | WinToKOI8 (string &s) |
bool | StartsWith (const string &body, const string &prefix) |
string | timestampLocal (time_t timeval) |
moo: timestamp stuff More... | |
string | timestampUTC (time_t timeval) |
vector< string > | stringSplit (const char *s, const char *delims) |
moo: convenience wrapper for string-to-vector tokenization using StringTokenizer More... | |
void | stringSplitE (const string &s, const string &delims, vector< string > &tokens) |
vector< string > | stringSplitE (const string &s, const string &delims) |
moo: stringSplitE() variant returning token-vector More... | |
uint32_t | date2int (signed int y, unsigned int m=1, unsigned int d=1) |
moo: date-to-int encoding (v2.2.4: use signed years) More... | |
void | int2date (uint32_t i, signed int *y, unsigned int *m=NULL, unsigned int *d=NULL) |
moo: int-to-date decoding (v2.2.4: use signed years) More... | |
string | int2hex (int32_t i) |
moo: int-to-hexadecimal string encoding; encoding preserves sort order (for subcorpus->server communications) More... |
int32_t | hex2int (const string &s) |
moo: hexadecimal-string-to-int decoding; encoding preserves sort order More... |
void | ddc_thread_init (const char *log_label=NULL) |
register a thread-local log prefix (unix only) More... | |
const char * | ddc_log_label (void) |
get thread-local log prefix, or empty string if none registered More... | |
const char * | ddc_set_log_label (const char *log_label) |
set thread-local log prefix; returns old label (if any) More... | |
int | GetPredictionPartOfSpeech (const string &PartOfSpeech, MorphLanguageEnum langua) |
bool | GetLanguageByString (string s, MorphLanguageEnum &Result) |
string | GetStringByLanguage (MorphLanguageEnum Langua) |
uint32_t | log2u32 (uint32_t v) |
template<class VecT > | |
size_t | VectorStride (const VecT &v) |
void | TrimHeap () |
template<class ContainerT > | |
void | ClearContainer (ContainerT &C) |
template<class T > | |
void | ClearVector (vector< T > &V) |
void | ClearString (string &S) |
int | isbracket (BYTE x) |
size_t | dual_bracket (BYTE x) |
bool | is_pseudo_graph (BYTE x) |
bool | is_spc_fill (BYTE x) |
bool | is_english_upper (BYTE x) |
bool | is_english_lower (BYTE x) |
bool | is_german_upper (BYTE x) |
bool | is_german_lower (BYTE x) |
bool | is_russian_upper (BYTE x) |
bool | is_russian_lower (BYTE x) |
bool | is_upper_consonant (BYTE x, MorphLanguageEnum Langua) |
bool | is_lower_vowel (BYTE x, MorphLanguageEnum Langua) |
bool | is_upper_vowel (BYTE x, MorphLanguageEnum Langua) |
bool | is_english_alpha (BYTE x) |
bool | is_russian_alpha (BYTE x) |
bool | is_german_alpha (BYTE x) |
bool | is_alpha (BYTE x) |
bool | is_alpha (BYTE x, MorphLanguageEnum langua) |
bool | is_lower_alpha (BYTE x, MorphLanguageEnum langua) |
bool | is_upper_alpha (BYTE x, MorphLanguageEnum langua) |
bool | isnspace (BYTE x) |
BYTE | etoupper (BYTE ch) |
BYTE | etolower (BYTE ch) |
BYTE | rtoupper (BYTE ch) |
BYTE | rtolower (BYTE ch) |
BYTE | gtoupper (BYTE ch) |
BYTE | gtolower (BYTE ch) |
BYTE | ReverseChar (BYTE ch, MorphLanguageEnum langua) |
string & | EngMakeUpper (string &word) |
string & | EngMakeLower (string &word) |
string & | EngRusMakeLower (string &word) |
char * | RmlMakeUpper (char *word, MorphLanguageEnum langua) |
string & | RmlMakeUpper (string &word, MorphLanguageEnum langua) |
string & | RmlMakeLower (string &word, MorphLanguageEnum langua) |
string & | EngRusMakeUpper (string &word) |
char * | EngRusMakeUpper (char *word) |
bool | IsRussian (const char *word) |
bool | CheckLanguage (const char *word, MorphLanguageEnum langua) |
void | ConvertJO2Je (string &src) |
void | ConvertJO2Je (char *src, size_t Length) |
string | ConvertASCIIToHtmlSymbols (const string &txt) |
template<class T , class Pred , class Conv > | |
T & | RegisterConverter (T &word, size_t Len, Pred P, Conv C) |
template<class T > | |
T & | GerEngRusMakeUpperTemplate (T &word, MorphLanguageEnum Langua, size_t Len) |
Variables | |
const unsigned int | _MAX_PATH = 512 |
const BYTE | cHyphenChar = (BYTE) '-' |
const BYTE | cParagraph = (BYTE) 21 |
const BYTE | cCompanyChar = (BYTE) 176 |
const BYTE | cIonChar = (BYTE) 183 |
const BYTE | cNumberChar = (BYTE) 0xB9 |
const BYTE | cPiChar = (BYTE) 182 |
const BYTE | cEllipseChar = (BYTE) 133 |
const BYTE | UnknownPartOfSpeech = 0xff |
const BYTE | Auml = 196 |
const BYTE | auml = 228 |
const BYTE | Uuml = 220 |
const BYTE | uuml = 252 |
const BYTE | Ouml = 214 |
const BYTE | ouml = 246 |
const BYTE | szlig = 223 |
const BYTE | Nu = 181 |
const BYTE | agrave = 224 |
const BYTE | egrave = 232 |
const BYTE | eacute = 233 |
const BYTE | LowerJO_cp1251 = 184 |
const BYTE | UpperJO_cp1251 = 168 |
const BYTE | LowerE_cp1251 = 229 |
const BYTE | UpperE_cp1251 = 197 |
const BYTE | Apostrophe = 39 |
#define WIN32_LEAN_AND_MEAN |
#define likely | ( | x | ) | x |
#define unlikely | ( | x | ) | x |
Referenced by CQCountKeyExprDateSlice::Evaluate().
#define _QM | ( | X | ) | (((QWORD)1)<<X) |
Referenced by ConvertToPlural(), CGraLine::DelDes(), FiniteFormCoordRussian(), GenderNumber(), GenderNumberCaseAnimRussian(), GenderNumberCaseNotAnimRussian(), GenderNumberGerman(), GetGramInfosFromWord(), CGraphmatFile::GetGraphematicalLine(), CRusGramTab::GleicheGenderNumberCase(), CAgramtab::grammems_to_str(), CUnitHolder::HasDescr(), CGraLine::HasMacroSyntaxDelimiter(), CRusGramTab::is_morph_personal_pronoun(), CGraLine::IsWordOrNumberOrAbbr(), MixedGleiche(), CAgramtab::ProcessPOSAndGrammems(), CRusGramTab::ProcessPOSAndGrammems(), CGraLine::SetDes(), SoloGleiche(), SubjectPredicate(), SubjectPredicateGerman(), and WeakGleiche().
typedef unsigned char BYTE |
typedef uint32_t DWORD |
typedef uint16_t WORD |
typedef uint64_t QWORD |
typedef unsigned int UINT |
typedef vector<string> StringVector |
typedef set<string> StringSet |
typedef vector<DWORD> DwordVector |
typedef QWORD file_off_t |
enum MorphLanguageEnum |
enum RegisterEnum |
|
inline |
bool FileExists | ( | const char * | FName | ) |
Referenced by CHitBorders::CBreakCollection::ClearAll(), CHost::CreateSocket(), CConcIndexator::DestroyIndex(), CStringIndexSet::DestroyIndexSet(), CIndexSetForQueryingStage::DestroyIndexSet(), FileExists(), CConcXml::FinalSaveBibliography(), IsRmlRegistered(), MorphoWizard::load_gramtab(), CConcordance::LoadCorpusFiles(), LoadHosts(), CIndexSetForQueryingStage::LoadIndexSet(), CConcordance::LoadMaskedFiles(), main(), MakePath(), ddcStringEnum< OffT_ >::open(), ddcCorpusList< OffT_ >::open(), CHitBorders::RemoveHitBordersFileAndClear(), RemoveWithPrint(), CConcXml::UnionBibliographies(), and CFatalExpc::~CFatalExpc().
|
inline |
bool IsDirectory | ( | const char * | DirName | ) |
Referenced by FileExists(), IsDirectory(), and MakeDirP().
|
inline |
file_off_t FileSize | ( | const char * | filename | ) |
References FSeek(), and FTell().
Referenced by FileSize(), CIndexSetForQueryingStage::GetOccurrsFileSize(), IsDirectory(), CShortStringHolder::ReadShortStringHolder(), ReadVector(), CConcXml::SplitBibliography(), and CConcXml::UnionBibliographies().
|
inline |
References AddFile(), CreateTempFileName(), CurrentDirectory(), ErrorMessage(), FileAppend(), FileAppendPartial(), FileBasename(), FileDirectory(), FileExtension(), FileMTime(), FileSize(), FSeek(), FTell(), GetPathByFile(), IsAbsolutePath(), IsBinFile(), IsEmptyLine(), IsHtmlFile(), IsJsonFile(), IsTableFile(), MakeDir(), MakeDirP(), MakeFName(), MakePath(), RelativeFileName(), RelativePathName(), RemoveWithPrint(), RmlCopyFile(), and RmlMoveFile().
time_t FileMTime | ( | const char * | filename | ) |
Referenced by FileSize(), and CConcordance::UpdateTimestamp().
bool FSeek | ( | FILE * | fp, |
file_off_t | pos, | ||
int | origin | ||
) |
Referenced by FileSize(), ddcFileOrMMap::ReadFromFile(), CIndexSetForLoadingStage::RollbackLoadIndex(), and CConcXml::SplitBibliography().
file_off_t FTell | ( | FILE * | fp | ) |
Referenced by FileSize(), and CItemIndexForLoading::ReadFromTemporalFile().
void ErrorMessage | ( | const string & | Label, |
const string & | Message | ||
) |
Referenced by CIndexSetForQueryingStage::AssertHasPath(), CConcordance::AssertHasPath(), CGraphanDicts::BuildOborot(), CGraphanDicts::BuildOborottos(), MorphoWizard::check_paradigm(), CItemIndexForLoading::CheckOccurrences(), CShortStringHolder::CreateFromSequence(), CreateMorphIndex(), CMyTimeSpanHolder::EndTimer(), TItemContainer::ErrorMessage(), ErrorMessage(), FileSize(), MorphoWizard::find_lemm(), MorphoWizard::find_wordforms(), CConcSession::GenerateOneHitString(), CConcSession::GenerateOneHitStringJson(), CMorphDictBuilder::GenPredictIdx(), CConcSession::GetContext(), CConcSession::GetContextJson(), TItemContainer::GetDomItemStr(), CDDCBranchServer::GetFirstHitsFromCorpora(), CConcSession::GetHits(), CDDCBranchServer::GetHitStringsFromOneCorpus(), CConcSession::GetOccurrences(), InitAlphabet(), CMorphDict::Load(), CMorphAutomat::Load(), MorphoWizard::predict_lemm(), ReadXmlField(), CBiblIndex::RegisterFreeBiblAttributes(), CStringIndexator::RegisterStringIndices(), CMorphDict::Save(), CMorphAutomat::Save(), CDDCBranchServer::SendGetHitStringsRequest(), CConcSession::SimpleQuery(), CHitBorders::StartIndexing(), and WriteVector().
void ErrorMessage | ( | const string & | Message | ) |
string MakeFName | ( | const string & | InpitFileName, |
const string & | Ext | ||
) |
Referenced by CIndexSetForLoadingStage::AddMemoryLoadIndexToMainLoadIndex(), CConcIndexator::CreateAsUnion(), CIndexSetForLoadingStage::CreateTempFiles(), FileSize(), CBiblIndex::GetBiblDateIndexFileName(), CBiblIndex::GetBiblFileName(), CBiblIndex::GetBiblIndexFileName(), CHitBorders::CBreakCollection::GetBreakFileName(), ConcIndexatorInvoker::GetErrorLogFileName(), CConcordance::GetFileNameForCorpusFileNames(), CIndexSetForQueryingStage::GetFileNameForInfos(), CConcordance::GetFileNameForMaskedFileIds(), CConcordance::GetFileNameForMaskedFiles(), CFreeBiblIndex::GetIndexFileName(), CIndexSetForQueryingStage::GetOccHdrFileName(), CIndexSetForQueryingStage::GetOccursFileName(), CHitBorders::GetPageBreaksFileName(), CIndexSetForQueryingStage::GetPeriodsDivisionFileName(), CStringIndexator::GetSearchPeriodsFileName(), CStringIndexSet::GetStorageFileName(), CFreeBiblStringIndex::GetStringFileName(), CIndexSetForQueryingStage::GetSuffixFileName(), ConcIndexatorInvoker::GetTimeStatisticsFileName(), CDDCLeafServer::handle__info(), CMorphDict::Load(), CConcordance::LoadSourceFilesAndOptions(), main(), CGraphanDicts::ReadAbbrevations(), CMorphDict::Save(), CConcordance::SaveOptions(), and CConcIndexator::SplitProject().
bool MakePath | ( | const char * | RossPath, |
const char * | FileName, | ||
char * | FullPath | ||
) |
References FileExists().
Referenced by FileSize(), TRoss::FullLoad(), TRoss::LoadOnlyConstants(), and TRoss::ReadUnitComments().
string GetPathByFile | ( | string | FileName | ) |
Referenced by ConcIndexatorInvoker::BuildIndex(), FileSize(), MorphoWizard::get_predict_src_file_path(), and GetFullPathByName().
bool IsBinFile | ( | const char * | FileName | ) |
Referenced by TRoss::BuildCorteges(), TRoss::BuildUnits(), FileSize(), and TRoss::ReadUnitComments().
bool IsEmptyLine | ( | const char * | t | ) |
Referenced by FileSize(), and TRoss::ReadFromStrWithOneSignatura().
bool IsHtmlFile | ( | const string & | FileName | ) |
References EngMakeLower(), and FileExtension().
Referenced by FileSize(), and CIndexDocument::NormalizeDocumentBuffer().
bool IsTableFile | ( | const string & | FileName | ) |
References EngMakeLower(), and FileExtension().
Referenced by FileSize().
bool IsJsonFile | ( | const string & | FileName | ) |
References EngMakeLower(), and FileExtension().
Referenced by FileSize().
string FileExtension | ( | const string & | FileName | ) |
Referenced by FileSize(), IsHtmlFile(), IsJsonFile(), and IsTableFile().
string FileDirectory | ( | const string & | FileName | ) |
Returns directory part of FileName, or "." if FileName is a bare filename, like dirname(3)
Referenced by FileSize(), MakeDirP(), RelativeFileName(), and CConcIndexator::SplitProject().
string FileBasename | ( | const string & | FileName | ) |
Returns file part of FileName, like basename(3)
Referenced by FileBasename(), FileSize(), and CDDCLeafServer::handle__info().
string FileBasename | ( | const string & | FileName, |
const string & | FileExtension | ||
) |
Returns basename FileName, removing any trailing extension FileExtension.
References FileBasename().
string CurrentDirectory | ( | void | ) |
Wrapper for getcwd(); returns current working directory of current process.
Referenced by do_start(), and FileSize().
bool IsAbsolutePath | ( | const string & | PathName | ) |
Returns true iff PathName is an absolute path (simple string heuristics)
Referenced by FileSize(), and RelativePathName().
string RelativePathName | ( | const string & | RefDir, |
const string & | PathName | ||
) |
If PathName is absolute, it is returned; otherwise returns (RefDir + "/" + PathName)
References IsAbsolutePath().
Referenced by FileSize(), and RelativeFileName().
string RelativeFileName | ( | const string & | RefFile, |
const string & | PathName | ||
) |
If PathName is absolute, it is returned; otherwise returns (FileDirectory(RefFile) + "/" + PathName)
References FileDirectory(), and RelativePathName().
Referenced by FileSize(), CDDCLeafServer::handle__info(), CConcordance::LoadOptionsFromString(), CSourceFileHolder::ReadSourceFileList(), and CDDCServerOptions::Set().
void AddFile | ( | const char * | MainFile, |
const char * | ToAdd | ||
) |
AddFile(): old ugly file-append hack using system("cat...")
References _MAX_PATH.
Referenced by FileSize().
void FileAppend | ( | FILE * | src, |
FILE * | dst | ||
) |
FileAppend(): newer better replacement for AddFile()
References DDC_STATIC_BUFLEN.
Referenced by FileAppend(), FileSize(), and CConcXml::UnionBibliographies().
void FileAppend | ( | const char * | srcFile, |
const char * | dstFile | ||
) |
void FileAppend | ( | const string & | srcFile, |
const string & | dstFile | ||
) |
void FileAppendPartial | ( | FILE * | src, |
FILE * | dst, | ||
size_t | nBytes | ||
) |
FileAppendPartial(): append a substring of src to dst.
References DDC_STATIC_BUFLEN, and Format().
Referenced by FileSize(), and CConcXml::SplitBibliography().
bool RmlMoveFile | ( | const char * | oldpath, |
const char * | newpath | ||
) |
References RmlCopyFile().
Referenced by CIndexSetForLoadingStage::AddMemoryLoadIndexToMainLoadIndex(), and FileSize().
bool RmlCopyFile | ( | const char * | oldpath, |
const char * | newpath | ||
) |
string CreateTempFileName | ( | ) |
bool MakeDir | ( | const string & | DirName | ) |
bool MakeDirP | ( | const string & | DirName | ) |
References FileDirectory(), Format(), IsDirectory(), MakeDir(), and MakeDirP().
Referenced by FileSize(), MakeDirP(), and CConcIndexator::SplitProject().
bool RemoveWithPrint | ( | const string & | FileName | ) |
References FileExists().
Referenced by CIndexSetForLoadingStage::DeleteTempFiles(), and FileSize().
size_t GetNumberOfOpenFiles | ( | pid_t | pid = 0 | ) |
return the number of open files for pid (linux only).
Referenced by DDCProcessMemoryStatus::fetch(), CDDCLeafServer::handle__status(), and CDDCBranchServer::handle__status().
string GetRegistryString | ( | string | RegistryPath | ) |
References GetIniFilePath(), GetRmlVariable(), and GetStringInnerFromTheFile().
Referenced by CanGetRegistryString(), CreateLockFile(), ddcLog(), DDCProcessMemoryStatus::fetch(), GetThesaurusPath(), CGraphmatFile::LoadDicts(), CGraphanDicts::ReadAbbrevations(), and CAgramtab::RegistryFilename().
bool CanGetRegistryString | ( | string | RegistryPath | ) |
References GetRegistryString().
Referenced by DDCProcessMemoryStatus::fetch(), and GetThesaurusPath().
bool IsRmlRegistered | ( | string & | Error | ) |
References FileExists(), GetIniFilePath(), CExpc::m_strCause, and RML_REGISTRY_FILENAME.
Referenced by DDCProcessMemoryStatus::fetch(), LoadDDCServer(), LoadLocalCorpora(), and main().
struct tm RmlGetCurrentTime | ( | ) |
References DDCTimeUnix::CalendarTime(), and DDCTimeUnix::Now().
Referenced by TUnitComment::TUnitComment().
string GetIniFilePath | ( | ) |
References GetRmlVariable().
Referenced by DDCProcessMemoryStatus::fetch(), GetRegistryString(), IsRmlRegistered(), LoadDDCServer(), LoadLocalCorpora(), and main().
string GetRmlVariable | ( | ) |
References Trim().
Referenced by BuildRMLPath(), DDCProcessMemoryStatus::fetch(), GetIniFilePath(), GetRegistryString(), and CLemmatizer::LoadDictionariesRegistry().
char* rtrim | ( | char * | s | ) |
Referenced by TItemContainer::BuildDomens(), TItemContainer::BuildFields(), DDCProcessMemoryStatus::fetch(), CDwdsThesaurus::LoadDwdsThesaurus(), CGraphanDicts::ReadExtensions(), TRoss::ReadFromStrWithOneSignatura(), CGraphanDicts::ReadKeyboard(), CGraphanDicts::ReadSpaces(), and CDocumentIterator::ReadTabFormatDocument().
bool IsSuperEqualChar | ( | BYTE | ch1, |
BYTE | ch2, | ||
MorphLanguageEnum | langua | ||
) |
References is_english_upper(), is_russian_upper(), ReverseChar(), and rtolower().
Referenced by DDCProcessMemoryStatus::fetch(), CGraphmatFile::FindKeySequence(), and StrSpacingCompare().
int CompareWithoutRegister | ( | const char * | s1, |
const char * | s2, | ||
size_t | l, | ||
MorphLanguageEnum | langua | ||
) |
References ReverseChar().
Referenced by DDCProcessMemoryStatus::fetch(), and CGraphanDicts::FindInIdents().
BYTE force_rus_char | ( | BYTE | ch | ) |
Referenced by DDCProcessMemoryStatus::fetch(), and force_to_rus().
bool force_to_rus | ( | char * | dest, |
const char * | sour, | ||
size_t | len | ||
) |
References force_rus_char(), and is_russian_alpha().
Referenced by DDCProcessMemoryStatus::fetch(), and CGraphmatFile::InitNonContextDescriptors().
char* IntToStr | ( | int | Value, |
char * | Buffer | ||
) |
Referenced by DDCProcessMemoryStatus::fetch(), and CGraphmatFile::GetGraphematicalLine().
string& IntToStr | ( | int | Value, |
string & | oBuffer | ||
) |
string& TrimLeft | ( | string & | str | ) |
Referenced by DDCProcessMemoryStatus::fetch(), and Trim().
string& TrimRight | ( | string & | str | ) |
Referenced by DDCProcessMemoryStatus::fetch(), CSocketAddr::ParseAddrPort(), and Trim().
string& Trim | ( | string & | str | ) |
References TrimLeft(), and TrimRight().
Referenced by CBiblIndex::AddBiblExpander(), AddMessage(), MorphoWizard::AddPrefixSet(), BuildHtmlHitStrWithHighlighting(), MorphoWizard::check_common_grammems(), MorphoWizard::check_prefixes(), CQueryTokenNode::CreateFileList(), CRunQueryData::CRunQueryData(), DeleteEmptyLines(), DDCProcessMemoryStatus::fetch(), MorphoWizard::find_wordforms(), CHitBorders::GetBorderIndicesString(), GetCWBFormattedStringRecursive(), CDDCBranchServer::GetHitContexts(), CDDCBranchServer::GetHitStringsFromOneCorpus(), CStringIndexator::GetIndicesString(), GetInterfacePOS(), GetLogLevel(), GetRmlVariable(), GetStringInnerFromTheFile(), GetTextFromXMLRecursive(), GetValue(), CDictionary::ImportFromText(), CConcIndexator::IndexOneTableTextArea(), CTabFormatIndexator::IndexTabFormat(), CRunQueryData::Init(), CMorphDict::Load(), CConcordance::LoadCorpusFiles(), LoadHosts(), CConcordance::LoadMaskedFiles(), newTermExpander(), NormalizeOborotStr(), ddcStringEnum< OffT_ >::openCompat(), ddcCorpusList< OffT_ >::openCompat(), CTabFormatIndexator::ProcessMetaField(), ReadAbbrevationsFromOneFile(), TRoss::ReadConfig(), ReadFlexiaModels(), CDumpParadigm::ReadFromFile(), CBibliography::ReadFromString(), CHost::ReadFromString(), CHighlightTags::ReadFromString(), CFlexiaModel::ReadFromString(), CGraphanDicts::ReadIdents(), CConcXml::ReadMorphXmlFileIntoGraTable(), MorphoWizard::ReadOnePrefixSet(), CLemmatizer::ReadOptions(), CDwdsThesaurus::ReadPathFromString(), CDDCBranchServer::ReadSelectedHosts(), CSourceFileHolder::ReadSourceFileList(), ReadTabFormatDocumentName(), ReadXmlField(), CFreeBiblStringIndex::RegisterBiblStringItemId(), CHitBorders::RegisterBorderIndices(), CBiblIndex::RegisterFreeBiblAttributes(), CStringIndexator::RegisterIndexAliases(), CStringIndexator::RegisterStringIndices(), CBiblIndex::RegisterTextAreas(), TxLang::setLanguage(), and MorphoWizard::slf_to_mrd().
bool LoadFileToString | ( | string | FileName, |
string & | Result, | ||
bool | clobber = true |
||
) |
References ReadVector().
Referenced by DDCProcessMemoryStatus::fetch(), CDDCLeafServer::handle__info(), CConcordance::LoadCorpusFiles(), CDDCServerOptions::LoadFile(), CConcordance::LoadOptionsFromFile(), CConcordance::LoadOptionsFromString(), CConcordance::LoadSourceFilesAndOptions(), and CLemmatizer::ReadOptions().
bool SaveStringToFile | ( | const string & | Str, |
const string & | FileName | ||
) |
References WriteVector().
Referenced by DDCProcessMemoryStatus::fetch(), and CConcIndexator::SplitProject().
void KOI8ToWin | ( | string & | s | ) |
References ktw().
Referenced by DDCProcessMemoryStatus::fetch().
void WinToKOI8 | ( | string & | s | ) |
References wtk().
Referenced by DDCProcessMemoryStatus::fetch().
bool StartsWith | ( | const string & | body, |
const string & | prefix | ||
) |
Referenced by DDCProcessMemoryStatus::fetch(), CTabFormatIndexator::IndexTabFormat(), CSocketAddr::ParseSocketAddr(), CTabFormatIndexator::ProcessMetaField(), and ReadTabFormatDocumentName().
string timestampLocal | ( | time_t | timeval | ) |
moo: timestamp stuff
Referenced by DDCProcessMemoryStatus::fetch().
string timestampUTC | ( | time_t | timeval | ) |
Referenced by DDCProcessMemoryStatus::fetch(), CDDCLeafServer::handle__info(), CDDCLeafServer::handle__status(), and CDDCBranchServer::handle__status().
vector<string> stringSplit | ( | const char * | s, |
const char * | delims | ||
) |
moo: convenience wrapper for string-to-vector tokenization using StringTokenizer
References StringTokenizer::get_tokens().
Referenced by TxDispatcher::addExpander(), CDDCBranchServer::AlignCorpusPath(), TxCab::compile(), ddc_parse_format_version(), DDCProcessMemoryStatus::fetch(), TxDispatcher::getChain(), CDDCLeafServer::handle__expand_terms(), IndexOneToken(), CStringIndexator::IndexTokenFixLongColumns(), CDDCServer::ProcessSocketString(), SubcorpusRequestRegex(), and TruncateLongColumns().
void stringSplitE | ( | const string & | s, |
const string & | delims, | ||
vector< string > & | tokens | ||
) |
moo: split a string using std::string() methods only, allowing empty tokens
Referenced by CQKeys::Compile(), do_start(), DDCProcessMemoryStatus::fetch(), CDDCServerOptions::LoadString(), and stringSplitE().
vector<string> stringSplitE | ( | const string & | s, |
const string & | delims | ||
) |
moo: stringSplitE() variant returning token-vector
References stringSplitE().
uint32_t date2int | ( | signed int | y, |
unsigned int | m = 1 , |
||
unsigned int | d = 1 |
||
) |
moo: date-to-int encoding (v2.2.4: use signed years)
Referenced by CBibliography::ConvertDateToInt(), and DDCProcessMemoryStatus::fetch().
void int2date | ( | uint32_t | i, |
signed int * | y, | ||
unsigned int * | m = NULL , |
||
unsigned int * | d = NULL |
||
) |
moo: int-to-date decoding (v2.2.4: use signed years)
Referenced by CQCountKeyExprDate::Evaluate(), CQCountKeyExprDateSlice::Evaluate(), and DDCProcessMemoryStatus::fetch().
string int2hex | ( | int32_t | i | ) |
moo: int-to-hexadecimal string encoding; encoding preserves sort order (for subcorpus->server communications)
Referenced by DDCProcessMemoryStatus::fetch(), CConcSession::GetHitIds(), and CConcSession::GetSortKeyHint().
int32_t hex2int | ( | const string & | s | ) |
moo: hexadecimal-string-to-int decoding; encoding preserves sort order
Referenced by DDCProcessMemoryStatus::fetch(), CFreeBiblIndex::GetIntegerLowerBound(), and CConcSession::SortKeyLB().
void ddc_thread_init | ( | const char * | log_label = NULL | ) |
register a thread-local log prefix (unix only)
References ddc_loglabel_key, ddc_thread_data_alloc(), and ddc_thread_data_once.
Referenced by do_start(), DDCProcessMemoryStatus::fetch(), ListenerThread(), main(), and CDDCServerThread::run().
const char* ddc_log_label | ( | void | ) |
get thread-local log prefix, or empty string if none registered
References ddc_loglabel_key.
Referenced by ddc_set_log_label(), ddcLog(), and DDCProcessMemoryStatus::fetch().
const char* ddc_set_log_label | ( | const char * | log_label | ) |
set thread-local log prefix; returns old label (if any)
References ddc_log_label(), and ddc_loglabel_key.
Referenced by DDCProcessMemoryStatus::fetch().
int GetPredictionPartOfSpeech | ( | const string & | PartOfSpeech, |
MorphLanguageEnum | langua | ||
) |
References morphEnglish, morphGerman, morphRussian, predict_eng_pos, predict_ger_pos, predict_poses_size, predict_rus_pos, and UnknownPartOfSpeech.
Referenced by CMorphDictBuilder::GenerateUnitedFlexModels(), CMorphDictBuilder::GenPredictIdx(), and MorphoWizard::predict_lemm().
bool GetLanguageByString | ( | string | s, |
MorphLanguageEnum & | Result | ||
) |
References EngRusMakeUpper(), morphEnglish, morphGeneric, morphGerman, morphRussian, and morphURL.
Referenced by MorphoWizard::load_wizard(), CConcordance::LoadOptionsFromString(), and TxLang::setLanguage().
string GetStringByLanguage | ( | MorphLanguageEnum | Langua | ) |
References morphEnglish, morphGeneric, morphGerman, morphRussian, and morphURL.
Referenced by TxDispatcher::ensureDefaultExpanders(), CMorphDictBuilder::GenPredictIdx(), CDDCLeafServer::handle__info(), InitMorphologySystem(), CMorphAutomat::Load(), MorphoWizard::load_gramtab(), MorphoWizard::load_static(), CConcordance::LoadOptionsFromString(), CConcordance::SaveOptionsToString(), and TxLang::setLanguage().
|
inline |
uint32_t log2u32 | ( | uint32_t | v | ) |
fast approximation of base-2 logarithm for unsigned integers (= most significant bit)
Referenced by CQueryNode::ConvertOccurrencesToHits(), CQueryBinaryOperationNode::hits_and_positions_difference(), CQueryBinaryOperationNode::hits_and_positions_intersection(), CConcSession::InitFileReferences(), and CQTokenOccurrenceIterator::seek().
|
inline |
size_t VectorStride | ( | const VecT & | v | ) |
get average size of gap between elements of v[]
v | vector of numeric types castable to (size_t), sorted in ascending order, implicit start=0 (e.g. ddcBreakVector) |
Referenced by CQueryNode::ConvertOccurrencesToHits(), and CConcSession::InitFileReferences().
|
inline |
void ClearContainer | ( | ContainerT & | C | ) |
Referenced by CConcSessionContext::CacheClear(), CShortOccurCache::Clear(), CSelectedHosts::Clear(), ClearString(), ClearVector(), CFreeBiblStringIndex::CreatePartitions(), and CConcSession::GetAllHits().
|
inline |
void ClearVector | ( | vector< T > & | V | ) |
References ClearContainer().
Referenced by CFirstHitsQueryResult::Clear(), CSelectedHosts::Clear(), CUnitHolder::ClearInputBuffer(), CItemIndexForLoading::ClearOccurrences(), CQueryResult::ClearQueryResults(), ddcStringEnum< OffT_ >::close(), ddcCorpusList< OffT_ >::close(), ddcVecFile< CIndexItem >::close(), CStringIndexSet::CreateSplitPartitions(), do_start(), ddcCorpusList< OffT_ >::ensureVec(), ddcVecFile< CIndexItem >::ensureVec(), CUnitHolder::FreeTable(), ddcStringEnum< OffT_ >::to_vector(), and CQueryNode::~CQueryNode().
|
inline |
void ClearString | ( | string & | S | ) |
References ClearContainer(), dual_bracket(), is_english_lower(), is_english_upper(), is_pseudo_graph(), is_spc_fill(), and isbracket().
Referenced by NavHintKey::clear(), CFreeBiblStringConstant::clear(), CRunQueryData::Clear(), CConcSession::ClearQueryResults(), ddcMMap< CIndexItem >::close(), and ddcCorpusList< OffT_ >::close().
int isbracket | ( | BYTE | x | ) |
References close_brackets, and open_brackets.
Referenced by ClearString(), CGraphmatFile::InitNonContextDescriptors(), and CGraLine::ReadWord().
size_t dual_bracket | ( | BYTE | x | ) |
References all_brackets, and open_brackets.
Referenced by ClearString(), and CGraphmatFile::DealSentBreaker().
bool is_pseudo_graph | ( | BYTE | x | ) |
bool is_spc_fill | ( | BYTE | x | ) |
Referenced by ClearString(), CGraLine::ReadWord(), and StrSpacingCompare().
bool is_english_upper | ( | BYTE | x | ) |
References ASCII, and EngUpper.
Referenced by ClearString(), EngMakeLower(), gtolower(), is_english_alpha(), is_upper_alpha(), CUnitHolder::is_uppercase(), IsSuperEqualChar(), and ReverseChar().
bool is_english_lower | ( | BYTE | x | ) |
References ASCII, and EngLower.
Referenced by ClearString(), EngMakeUpper(), EngRusMakeUpper(), GerEngRusMakeUpperTemplate(), gtoupper(), is_english_alpha(), is_lower_alpha(), CUnitHolder::is_lowercase(), and ReverseChar().
bool is_german_upper | ( | BYTE | x | ) |
References ASCII, and GerUpper.
Referenced by is_german_alpha(), is_upper_alpha(), CUnitHolder::is_uppercase(), and RmlMakeLower().
bool is_german_lower | ( | BYTE | x | ) |
References ASCII, and GerLower.
Referenced by GerEngRusMakeUpperTemplate(), is_german_alpha(), is_lower_alpha(), and CUnitHolder::is_lowercase().
bool is_russian_upper | ( | BYTE | x | ) |
References ASCII, and RusUpper.
Referenced by TItemContainer::CanBeRusAbbr(), EngRusMakeLower(), is_russian_alpha(), is_russian_upper_consonant(), is_upper_alpha(), CUnitHolder::is_uppercase(), IsSuperEqualChar(), ReverseChar(), and rtolower().
bool is_russian_lower | ( | BYTE | x | ) |
References ASCII, and RusLower.
Referenced by EngRusMakeUpper(), GerEngRusMakeUpperTemplate(), is_lower_alpha(), CUnitHolder::is_lowercase(), is_russian_alpha(), is_russian_lower_consonant(), ReverseChar(), and rtoupper().
bool is_upper_consonant | ( | BYTE | x, |
MorphLanguageEnum | Langua | ||
) |
References is_upper_alpha(), and is_upper_vowel().
Referenced by CLemmatizer::CheckAbbreviation().
bool is_lower_vowel | ( | BYTE | x, |
MorphLanguageEnum | Langua | ||
) |
References is_english_lower_vowel(), is_german_lower_vowel(), is_russian_lower_vowel(), morphEnglish, morphGerman, and morphRussian.
Referenced by MorphoWizard::slf_to_mrd(), and TransferReverseVowelNoToCharNo().
bool is_upper_vowel | ( | BYTE | x, |
MorphLanguageEnum | Langua | ||
) |
References is_english_upper_vowel(), is_german_upper_vowel(), is_russian_upper_vowel(), morphEnglish, morphGerman, and morphRussian.
Referenced by is_upper_consonant(), and TransferReverseVowelNoToCharNo().
bool is_english_alpha | ( | BYTE | x | ) |
References is_english_lower(), and is_english_upper().
Referenced by CheckLanguage(), CGraphmatFile::DealExtensionsAndLocalFileNames(), is_alpha(), is_generic_alpha(), and CUnitHolder::is_latin_alpha().
bool is_russian_alpha | ( | BYTE | x | ) |
References is_russian_lower(), and is_russian_upper().
Referenced by TItemContainer::CanBeRusAbbr(), TItemContainer::CanBeRusColloc(), CheckLanguage(), force_to_rus(), CGraphmatFile::InitNonContextDescriptors(), is_alpha(), TItemContainer::IsStandardRusLexeme(), and CGraLine::LengthUntilDelimiters().
bool is_german_alpha | ( | BYTE | x | ) |
References is_german_lower(), and is_german_upper().
Referenced by CheckLanguage(), is_alpha(), and CUnitHolder::is_latin_alpha().
bool is_alpha | ( | BYTE | x | ) |
References is_german_alpha(), and is_russian_alpha().
Referenced by InitAlphabet(), CGraLine::LengthUntilDelimiters(), NormalizeOborotStr(), and RmlPcreMakeTables().
bool is_alpha | ( | BYTE | x, |
MorphLanguageEnum | langua | ||
) |
References is_english_alpha(), is_generic_alpha(), is_german_alpha(), is_russian_alpha(), is_URL_alpha(), morphEnglish, morphGeneric, morphGerman, morphRussian, and morphURL.
bool is_lower_alpha | ( | BYTE | x, |
MorphLanguageEnum | langua | ||
) |
References is_english_lower(), is_generic_lower(), is_german_lower(), is_russian_lower(), morphEnglish, morphGeneric, morphGerman, morphRussian, and morphURL.
Referenced by AddFormsWithDifferentRegisters(), TItemContainer::CanBeRusAbbr(), TxCase::expand(), and RmlPcreMakeTables().
bool is_upper_alpha | ( | BYTE | x, |
MorphLanguageEnum | langua | ||
) |
References is_english_upper(), is_generic_upper(), is_german_upper(), is_russian_upper(), morphEnglish, morphGeneric, morphGerman, morphRussian, and morphURL.
Referenced by AbbrevIsEqualToString(), CreateMorphIndex(), TxMorph::expand(), GetWordForms(), InitAlphabet(), is_upper_consonant(), IsUpper(), MorphoWizard::ReadOnePrefixSet(), and RmlPcreMakeTables().
bool isnspace | ( | BYTE | x | ) |
References Azirkun, azirkun, Ccedille, ccedille, Eakut, eakut, Egravis, egravis, Ezirkun, ezirkun, Ntilda, ntilda, Ouml, ouml, Ozirkun, ozirkun, Uzirkun, and uzirkun.
Referenced by EngMakeUpper(), EngRusMakeUpper(), GerEngRusMakeUpperTemplate(), gtoupper(), and ReverseChar().
References Apostrophe, is_russian_lower(), LowerJO_cp1251, and UpperJO_cp1251.
Referenced by EngRusMakeUpper(), GerEngRusMakeUpperTemplate(), and ReverseChar().
References Apostrophe, is_russian_upper(), LowerJO_cp1251, and UpperJO_cp1251.
Referenced by EngRusMakeLower(), IsSuperEqualChar(), and ReverseChar().
References Auml, auml, etoupper(), is_english_lower(), Ouml, ouml, Uuml, and uuml.
Referenced by GerEngRusMakeUpperTemplate().
References Auml, auml, etolower(), is_english_upper(), Ouml, ouml, Uuml, and uuml.
Referenced by RmlMakeLower().
BYTE ReverseChar | ( | BYTE | ch, |
MorphLanguageEnum | langua | ||
) |
References Auml, auml, etolower(), etoupper(), is_english_lower(), is_english_upper(), is_russian_lower(), is_russian_upper(), morphEnglish, morphGeneric, morphGerman, Ouml, ouml, rtolower(), rtoupper(), Uuml, and uuml.
Referenced by AddFormsWithDifferentRegisters(), CompareWithoutRegister(), TxMorph::expand(), TxCase::expand(), GetWordForms(), CGraphmatFile::IsKey(), IsSuperEqualChar(), CGraphanDicts::ReadIdents(), and RmlPcreMakeTables().
string& EngMakeUpper | ( | string & | word | ) |
References etoupper(), is_english_lower(), and RegisterConverter().
Referenced by CQCount::countOptionsToString(), CConcSession::GetResultFormatByString(), CQFSort::toString(), CQFBiblSort::toString(), CQFContextSort::toString(), and CQFPrune::toString().
string& EngMakeLower | ( | string & | word | ) |
References etolower(), is_english_upper(), and RegisterConverter().
Referenced by CBiblIndex::AddBiblExpander(), GetLogLevel(), IsHtmlFile(), IsJsonFile(), IsTableFile(), newTermExpander(), and CDDCServerOptions::Set().
string& EngRusMakeLower | ( | string & | word | ) |
References etolower(), is_russian_upper(), and rtolower().
Referenced by RmlMakeLower().
char* RmlMakeUpper | ( | char * | word, |
MorphLanguageEnum | langua | ||
) |
References GerEngRusMakeUpperTemplate(), morphGeneric, and stoupper().
Referenced by AddFormsWithDifferentRegisters(), CQueryTokenNode::CreateThesPattern(), TxToUpper::expand(), TxCase::expand(), MorphoWizard::find_lemm(), CLemmatizer::LemmatizeWord(), NormalizeOborotStr(), ReadAbbrevationsFromOneFile(), CGraphanDicts::ReadENames(), CGraphanDicts::ReadKeyboard(), MorphoWizard::ReadOnePrefixSet(), and MorphoWizard::slf_to_mrd().
string& RmlMakeUpper | ( | string & | word, |
MorphLanguageEnum | langua | ||
) |
References GerEngRusMakeUpperTemplate(), morphGeneric, and stoupper().
string& RmlMakeLower | ( | string & | word, |
MorphLanguageEnum | langua | ||
) |
References EngRusMakeLower(), gtolower(), is_german_upper(), morphGeneric, morphGerman, RegisterConverter(), and stolower().
Referenced by AddFormsWithDifferentRegisters(), CQueryTokenNode::CreateLemmaPattern(), TxMorph::expand(), TxToLower::expand(), TxCase::expand(), MorphoWizard::get_lemm_string_with_accents(), CFormInfo::GetAccentedVowel(), GetWordForms(), CConcordance::LoadOptionsFromString(), MorphoWizard::mrd_to_slf(), and CBiblIndex::RegisterTextAreas().
string& EngRusMakeUpper | ( | string & | word | ) |
References etoupper(), is_russian_lower(), and rtoupper().
Referenced by GetLanguageByString(), and CGraphanDicts::ReadExtensions().
char* EngRusMakeUpper | ( | char * | word | ) |
References etoupper(), is_english_lower(), is_russian_lower(), and rtoupper().
bool IsRussian | ( | const char * | word | ) |
References CheckLanguage(), and morphRussian.
Referenced by TRoss::ReadFromStrWithOneSignatura().
bool CheckLanguage | ( | const char * | word, |
MorphLanguageEnum | langua | ||
) |
void ConvertJO2Je | ( | string & | src | ) |
void ConvertJO2Je | ( | char * | src, |
size_t | Length | ||
) |
References ConvertJO2JeTemplate().
Referenced by CLemmatizerRussian::FilterSrc(), CGraphmatFile::GraphmatMain(), and MorphoWizard::prepare_for_RML().
string ConvertASCIIToHtmlSymbols | ( | const string & | txt | ) |
Referenced by BuildHtmlHitStrWithHighlighting(), GenerateCountString(), and CConcSession::ShowBibliographyForTable().
T& RegisterConverter | ( | T & | word, |
size_t | Len, | ||
Pred | P, | ||
Conv | C | ||
) |
Referenced by EngMakeLower(), EngMakeUpper(), GerEngRusMakeUpperTemplate(), and RmlMakeLower().
T& GerEngRusMakeUpperTemplate | ( | T & | word, |
MorphLanguageEnum | Langua, | ||
size_t | Len | ||
) |
References etoupper(), gtoupper(), is_english_lower(), is_german_lower(), is_russian_lower(), morphGerman, RegisterConverter(), and rtoupper().
Referenced by CUnitHolder::BuildUnitBufferUpper(), and RmlMakeUpper().
const unsigned int _MAX_PATH = 512 |
Referenced by AddFile(), ConcIndexatorInvoker::BuildIndex(), and CreateTempFileName().
Referenced by CGraphmatFile::InitNonContextDescriptors().
Referenced by CGraLine::ReadWord().
Referenced by CGraLine::ReadWord().
Referenced by CGraLine::ReadWord().
Referenced by CGraLine::ReadWord().
Referenced by CGraLine::ReadWord().
Referenced by CUnitHolder::IsSentenceEndMark(), and CGraLine::ReadWord().
const BYTE UnknownPartOfSpeech = 0xff |
Referenced by CMorphDictBuilder::GenPredictIdx(), GetGramInfosFromWord(), CAgramtab::GetPartOfSpeech(), GetPredictionPartOfSpeech(), CAgramtab::GetTabStringByGramCode(), GetTagFromStr(), CLemmatizer::LemmatizeWord(), MorphoWizard::load_gramtab(), MorphoWizard::predict_lemm(), and CAgramtab::ProcessPOSAndGrammems().
const BYTE Auml = 196 |
Referenced by HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE auml = 228 |
Referenced by HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE Uuml = 220 |
Referenced by HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE uuml = 252 |
Referenced by HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE Ouml = 214 |
Referenced by etolower(), etoupper(), HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE ouml = 246 |
Referenced by etolower(), etoupper(), HTML::GetTextFromHTMLBuffer(), gtolower(), gtoupper(), and ReverseChar().
const BYTE szlig = 223 |
Referenced by HTML::GetTextFromHTMLBuffer(), and CGraphmatFile::InitNonContextDescriptors().
const BYTE Nu = 181 |
Referenced by CGraphmatFile::InitNonContextDescriptors().
const BYTE agrave = 224 |
Referenced by HTML::GetTextFromHTMLBuffer().
const BYTE egrave = 232 |
Referenced by HTML::GetTextFromHTMLBuffer().
const BYTE eacute = 233 |
Referenced by HTML::GetTextFromHTMLBuffer().
const BYTE LowerJO_cp1251 = 184 |
Referenced by ConvertJO2JeTemplate(), rtolower(), and rtoupper().
const BYTE UpperJO_cp1251 = 168 |
Referenced by ConvertJO2JeTemplate(), rtolower(), and rtoupper().
const BYTE LowerE_cp1251 = 229 |
Referenced by ConvertJO2JeTemplate().
const BYTE UpperE_cp1251 = 197 |
Referenced by ConvertJO2JeTemplate().
const BYTE Apostrophe = 39 |
Referenced by CGraLine::LengthUntilDelimiters(), rtolower(), and rtoupper().