moot.h
Go to the documentation of this file.
1 /* -*- Mode: C++ -*- */
2 /*
3  libmoot : moocow's part-of-speech tagging library
4  Copyright (C) 2003-2014 by Bryan Jurish <moocow@cpan.org>
5 
6  This library is free software; you can redistribute it and/or
7  modify it under the terms of the GNU Lesser General Public
8  License as published by the Free Software Foundation; either
9  version 3 of the License, or (at your option) any later version.
10 
11  This library is distributed in the hope that it will be useful,
12  but WITHOUT ANY WARRANTY; without even the implied warranty of
13  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  Lesser General Public License for more details.
15 
16  You should have received a copy of the GNU Lesser General Public
17  License along with this library; if not, write to the Free Software
18  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 */
20 
21 /*--------------------------------------------------------------------------
22  * File: moot.h
23  * Author: Bryan Jurish <moocow@cpan.org>
24  * Description:
25  * + moot PoS tagger : top level headers
26  *--------------------------------------------------------------------------*/
27 
33 #ifndef _MOOT_H
34 #define _MOOT_H
35 
36 /*----------------------------------------------------------------------
37  * autoheader configuration (safe)
38  */
39 #include <mootConfig.h>
40 
41 //----------------------------------------------------------------------
42 // Top-Level includes
43 #include <mootHMMTrainer.h> /*-- tagger model training --*/
44 #include <mootHMM.h> /*-- runtime tagging --*/
45 #include <mootDynHMM.h> /*-- runtime tagging, dynamic model --*/
46 #include <mootEval.h> /*-- tagger output evaluation --*/
47 
48 //----------------------------------------------------------------------
49 // Low-level utilities
50 #include <mootSTLHacks.h>
51 #include <mootTypes.h>
52 #include <mootUtils.h>
53 #include <mootModelSpec.h>
54 #include <mootEnum.h>
55 
56 //----------------------------------------------------------------------
57 // Low-level I/O
58 #include <mootIO.h>
59 #include <mootCIO.h>
60 #include <mootZIO.h>
61 #include <mootCxxIO.h>
62 #include <mootBufferIO.h>
63 #include <mootBinIO.h>
64 
65 //----------------------------------------------------------------------
66 // mootToken I/O
67 #include <mootToken.h>
68 #include <mootFlavor.h>
69 #include <mootTokenIO.h>
70 #include <mootGenericLexer.h>
71 #include <mootPPLexer.h>
72 #include <mootTokenLexer.h>
73 #include <mootRecode.h>
74 #include <mootExpatParser.h>
75 #include <mootTokenExpatIO.h>
76 #include <mootXmlDoc.h>
77 #include <mootTokenXmlDoc.h>
78 
79 //----------------------------------------------------------------------
80 // lexical-class frequency tables
81 #include <mootClassfreqs.h>
82 #include <mootClassfreqsLexer.h>
83 #include <mootClassfreqsParser.h>
84 #include <mootClassfreqsCompiler.h>
85 
86 //----------------------------------------------------------------------
87 // lexical frequency tables
88 #include <mootLexfreqsCompiler.h>
89 #include <mootLexfreqs.h>
90 #include <mootLexfreqsLexer.h>
91 #include <mootLexfreqsParser.h>
92 
93 //----------------------------------------------------------------------
94 // n-gram frequency tables
95 #include <mootNgramsCompiler.h>
96 #include <mootNgrams.h>
97 #include <mootNgramsLexer.h>
98 #include <mootNgramsParser.h>
99 
100 //----------------------------------------------------------------------
101 // Suffix tries (buggy: avoid!)
102 #include <mootAssocVector.h>
103 #include <mootTrieVector.h>
104 #include <mootSuffixTrie.h>
105 
106 //----------------------------------------------------------------------
107 // WASTE tokenization framework
108 #include <wasteTypes.h>
109 #include <wasteCase.h>
110 #include <wasteScanner.h>
111 #include <wasteLexicon.h>
112 #include <wasteLexer.h>
113 #include <wasteDecoder.h>
114 #include <wasteAnnotator.h>
115 #include <wasteTrainWriter.h>
116 
117 #endif /* _MOOT_H */
flex++ lexical-class-frequency parameter file lexer: autogenerated header
case-folding operation(s) for UTF-8 strings
flex++ n-gram frequency parameter file lexer: autogenerated header
useful utilities, especially for command-line programs
HMM training data: lexical-class frequencies: raw.
Hidden Markov Model tagger/disambiguator.
routines for tagger evaluation with respect to a test set
bison++ lexical-class-frequency parameter file parser: autogenerated header
mootio abstraction layer for C FILE*s
flex++ raw-text lexer: autogenerated header
interface to librecode (optional)
broken libxml2 support for mootToken I/O
safely includes autoheader preprocessor macros
flex++ lexer for moot::TokenReaderNative guts: autogenerated headers
classes and utilities for tokens and associated analyses
flex++ lexical-frequency parameter file lexer: autogenerated header
TokenWriter wrapper class for writing WASTE tokenizer 'well-done' training data from pre-tokenized in...
mootio I/O abstraction layer for zlib gzFile
common utilities for flex++ lexers
classes and utilities for regex-based token "flavor" heuristics
HMM training data: lexical frequencies: raw.
abstract templates for binary I/O
utilities for model specification
Common definitions for WASTE HMM-based tokenizer.
various STL and namespace-related hacks
C++ wrapper class for libxml2 tree-mode XML documents (optional)
trie implementation using std::vector<> for underlying storage
mootio abstraction layer for C++ streams
Compiler for lexical-frequency parameter files.
Abstract and native classes for I/O of moot::mootToken objects.
Declarations of the mid level lexer for the waste tokenizer.
runtime enumerations (1-1 maps: symbolic identifiers <-> unsigned integers)
Compiler for lexical-class-frequency parameter files.
mootio abstraction layer for C char* buffers
Hidden Markov Model tagger/disambiguator: training routines.
generic I/O abstraction layer
bison++ n-gram frequency parameter file parser: autogenerated header
suffix tries (experimental, optional)
moot::TokenIO abstraction layer for XML I/O via expat (optional)
Common typedefs and constants.
Declarations of the low level scanner for the waste tokenizer.
bison++ lexical-frequency parameter file parser: autogenerated header
HMM training data: n-gram frequencies: raw.
C++ wrapper class for generic expat XML parsers (optional)
simple hash_set<>-based lexicon class for moot::wasteLexer
Hidden Markov Model tagger/disambiguator for dynamic lexical probabilities.
LISP-style assoc vectors.
simple hash_set<>-based lexicon class for moot::wasteLexer
Compiler for n-gram frequency parameter files.