KJB
|
Classes | |
class | BankEdge |
struct | CharArrayEqualFunc |
struct | CharArrayHashFunc |
class | Edge |
class | EdgeLexer |
class | EdgeParser |
class | Exception |
class | HashMap |
class | Lexem |
class | Lexicon |
class | Model |
class | Pair |
class | Parameters |
class | RCObject |
class | RCIPtr |
class | StringMapEntry |
class | StringMap |
class | Tokenizer |
class | Trainer |
class | Pattern |
class | Tree |
class | Word |
Typedefs | |
typedef RCIPtr< BankEdge > | BankEdgePtr |
typedef std::list < spear::RCIPtr< BankEdge > > | BankEdgeList |
typedef std::list < spear::RCIPtr< BankEdge > >::const_reverse_iterator | BankEdgeListConstRevIter |
typedef std::list < spear::RCIPtr< BankEdge > >::const_iterator | BankEdgeListConstIter |
typedef struct spear::CharArrayEqualFunc | CharArrayEqualFunc |
typedef struct spear::CharArrayHashFunc | CharArrayHashFunc |
typedef RCIPtr< Edge > | EdgePtr |
typedef RCIPtr< spear::Lexem > | LexemPtr |
typedef RCIPtr< spear::Lexicon > | LexiconPtr |
typedef RCIPtr< Model > | ModelPtr |
typedef RCIPtr< Tokenizer > | TokenizerPtr |
typedef RCIPtr< spear::Trainer > | TrainerPtr |
typedef RCIPtr< Pattern > | PatternPtr |
typedef RCIPtr< spear::Tree > | TreePtr |
Enumerations | |
enum | PatternType { PATTERN_OBJ, PATTERN_IOBJ, PATTERN_SUBJ, PATTERN_PREP, PATTERN_ROBJ, PATTERN_RIOBJ, PATTERN_RSUBJ } |
enum | VerbType { VERB_ACTIVE, VERB_PASSIVE, VERB_COPULATIVE, VERB_INFINITIVE, VERB_GERUND } |
Functions | |
bool | compareWideCharToWideChar (const Char *s1, const Char *s2) |
void | simpleTokenize (const String &input, std::vector< String > &output, const String &separators) |
void | tokenizeWithQuotes (const String &input, std::vector< String > &output, const String &separators) |
String | quotify (const String &str) |
int | toInteger (const String &s) |
bool | isNumber (const String &s) |
bool | isNumberRange (const String &s) |
String | toUpper (const String &s) |
String | toLower (const String &s) |
bool | expandNumber (const String &number, std::vector< String > &expansion) |
String | mergeStrings (const String &s1, const String &s2) |
String | mergeStrings (const String &s1, const String &s2, const String &s3) |
String | mergeStrings (const String &s1, const String &s2, const String &s3, const String &s4) |
bool | startsWith (const String &big, const String &small) |
bool | endsWith (const String &big, const String &small) |
String | stripString (const String &s, int left, int right) |
template<typename T > | |
spear::RCIPtr< T > | findHead (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | traverseRightToLeft (const std::list< spear::RCIPtr< T > > &children, const Char *labels[], bool traverseLabelsFirst=true) |
template<typename T > | |
spear::RCIPtr< T > | traverseLeftToRight (const std::list< spear::RCIPtr< T > > &children, const Char *labels[], bool traverseLabelsFirst=true) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishNP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishADJP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishADVP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishCONJP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishFRAG (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishINTJ (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishLST (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishNAC (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishPP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishPRN (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishQP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishRRC (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishS (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishSBAR (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishSBARQ (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishSINV (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishSQ (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishUCP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishVP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishWHADJP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishWHADVP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishWHNP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishWHPP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishTOP (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishX (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglishNoCoord (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
TCRI | isCoordinatedHead (const std::list< spear::RCIPtr< T > > &children, TCRI current) |
template<typename T > | |
spear::RCIPtr< T > | findHeadEnglish (const String &parent, const std::list< spear::RCIPtr< T > > &children) |
template<typename T > | |
bool | operator== (const RCIPtr< T > &pointer, const RCIPtr< T > &other) |
template<typename T > | |
bool | operator!= (const RCIPtr< T > &pointer, const RCIPtr< T > &other) |
template<typename T > | |
bool | operator== (const RCIPtr< T > &pointer, const T *other) |
template<typename T > | |
bool | operator== (const T *other, const RCIPtr< T > &pointer) |
template<typename T > | |
bool | operator!= (const RCIPtr< T > &pointer, const T *other) |
template<typename T > | |
bool | operator!= (const T *other, const RCIPtr< T > &pointer) |
void | print_filename (const std::string &s, std::ostream &os) |
void | train_collins (const std::string &input_filename, const std::string &output_dir, const int &lf_thresh, std::ostream &os) |
Variables | |
size_t | LF_WORD_THRESHOLD = 6 |
typedef std::list< spear::RCIPtr<BankEdge> > spear::BankEdgeList |
typedef std::list< spear::RCIPtr<BankEdge> >::const_iterator spear::BankEdgeListConstIter |
typedef std::list< spear::RCIPtr<BankEdge> >::const_reverse_iterator spear::BankEdgeListConstRevIter |
typedef RCIPtr<BankEdge> spear::BankEdgePtr |
typedef struct spear::CharArrayEqualFunc spear::CharArrayEqualFunc |
typedef struct spear::CharArrayHashFunc spear::CharArrayHashFunc |
typedef RCIPtr<Edge> spear::EdgePtr |
typedef RCIPtr<spear::Lexem> spear::LexemPtr |
typedef RCIPtr<spear::Lexicon> spear::LexiconPtr |
typedef RCIPtr<Model> spear::ModelPtr |
typedef RCIPtr<Pattern> spear::PatternPtr |
typedef RCIPtr<Tokenizer> spear::TokenizerPtr |
typedef RCIPtr<spear::Trainer> spear::TrainerPtr |
typedef RCIPtr<spear::Tree> spear::TreePtr |
enum spear::PatternType |
enum spear::VerbType |
Expands numbers/fractions/ranges to their alphabetical representation, e.g. "113" ==> "one hundred thirteen".
spear::RCIPtr<T> spear::findHead | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
This function implements the head-finding heuristics. The type T can be any edge type that implements the following methods: const std::wstring & T::getLabel() const
spear::RCIPtr<T> spear::findHeadEnglish | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishADJP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishADVP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishCONJP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishFRAG | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishINTJ | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishLST | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishNAC | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishNoCoord | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishNP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishPP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishPRN | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishQP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishRRC | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishS | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishSBAR | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishSBARQ | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishSINV | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishSQ | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishTOP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishUCP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishVP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishWHADJP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishWHADVP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishWHNP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishWHPP | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
spear::RCIPtr<T> spear::findHeadEnglishX | ( | const String & | parent, |
const std::list< spear::RCIPtr< T > > & | children | ||
) |
TCRI spear::isCoordinatedHead | ( | const std::list< spear::RCIPtr< T > > & | children, |
TCRI | current | ||
) |
bool spear::isNumber | ( | const String & | s | ) |
Returns true if this is an integer, real, or fraction number
bool spear::isNumberRange | ( | const String & | s | ) |
Returns true if this is a number range, e.g. "N-M"
String spear::mergeStrings | ( | const String & | s1, |
const String & | s2, | ||
const String & | s3, | ||
const String & | s4 | ||
) |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
void spear::print_filename | ( | const std::string & | s, |
std::ostream & | os | ||
) |
Constructs a valid quote-surrounded token. All quotes inside the token are preceded by \
void spear::simpleTokenize | ( | const String & | input, |
std::vector< String > & | output, | ||
const String & | separators | ||
) |
int spear::toInteger | ( | const String & | s | ) |
void spear::tokenizeWithQuotes | ( | const String & | input, |
std::vector< String > & | output, | ||
const String & | separators | ||
) |
String tokenization, considering everything within quotes as 1 token. Regular quotes inside tokens MUST be preceded by \
void spear::train_collins | ( | const std::string & | input_filename, |
const std::string & | output_dir, | ||
const int & | lf_thresh, | ||
std::ostream & | os | ||
) |
spear::RCIPtr<T> spear::traverseLeftToRight | ( | const std::list< spear::RCIPtr< T > > & | children, |
const Char * | labels[], | ||
bool | traverseLabelsFirst = true |
||
) |
spear::RCIPtr<T> spear::traverseRightToLeft | ( | const std::list< spear::RCIPtr< T > > & | children, |
const Char * | labels[], | ||
bool | traverseLabelsFirst = true |
||
) |
size_t spear::LF_WORD_THRESHOLD = 6 |