#include <TextHandler.hpp>
Inheritance diagram for TextHandler:
Public Types | |
enum | TokenType { BEGINDOC = 1, ENDDOC = 2, WORD = 3, BEGINTAG = 4, ENDTAG = 5, SYMBOL = 6 } |
Public Methods | |
TextHandler () | |
virtual | ~TextHandler () |
virtual void | setTextHandler (TextHandler *th) |
Set the TextHandler that this TextHandler will pass information on to. | |
virtual TextHandler * | getTextHandler () |
Get the TextHandler that this TextHandler will pass information on to. | |
virtual void | foundToken (int type, char *token=NULL, char *orig=NULL, PropertyList *properties=NULL) |
virtual char * | handleBeginDoc (char *docno, char *original, PropertyList *list) |
virtual char * | handleEndDoc (char *token, char *original, PropertyList *list) |
virtual char * | handleWord (char *word, char *original, PropertyList *list) |
virtual char * | handleBeginTag (char *tag, char *original, PropertyList *list) |
Handle a begin tag. | |
virtual char * | handleEndTag (char *tag, char *original, PropertyList *list) |
Handle an end tag. | |
virtual char * | handleSymbol (char *symbol, char *original, PropertyList *list) |
virtual void | foundDoc (char *docno) |
Found a document with document number. | |
virtual void | foundDoc (char *docno, char *original) |
virtual void | foundWord (char *word) |
Found a word. | |
virtual void | foundWord (char *word, char *original) |
virtual void | foundEndDoc () |
Found end of doc. | |
virtual void | foundSymbol (char *sym) |
Found a symbol. | |
virtual char * | handleDoc (char *docno) |
Handle a doc. | |
virtual char * | handleWord (char *word) |
Handle a word, possibly transforming it. | |
virtual void | handleEndDoc () |
Handle the end of the doc. | |
virtual char * | handleSymbol (char *sym) |
Handle a symbol, possibly transforming it. | |
Protected Attributes | |
TextHandler * | textHandler |
The next textHandler in the chain. | |
char | buffer [MAXWORDSIZE] |
|
|
|
|
|
|
|
|
|
Found a document with document number.
|
|
Found end of doc.
|
|
Found a symbol.
|
|
|
|
|
|
Found a word.
|
|
Get the TextHandler that this TextHandler will pass information on to.
|
|
Handle a doc begin - default implementation calls handleDoc for backward compatibility. |
|
Handle a begin tag.
|
|
Handle a doc.
Reimplemented in DocFreqIndexer, FreqCounter, InvFPTextHandler, PropIndexTH, FlattextDocMgr, WriterInQueryHandler, and WriterTextHandler. |
|
Handle the end of the doc.
Reimplemented in DocFreqIndexer. |
|
Handle a doc end - default implementation calls old handleEndDoc for backward compatibility. |
|
Handle an end tag.
|
|
Handle a symbol, possibly transforming it.
Reimplemented in WriterInQueryHandler. |
|
Handle a symbol - default implementation calls old handleSymbol for backward compatibility. |
|
Handle a word, possibly transforming it.
Reimplemented in CtfIndexer, DocFreqIndexer, FreqCounter, InvFPTextHandler, QueryTextHandler, Stemmer, Stopper, WriterInQueryHandler, and WriterTextHandler. |
|
Handle a word - default implementation calls old handleWord for backward compatibility. Reimplemented in PropIndexTH and BrillPOSTokenizer. |
|
Set the TextHandler that this TextHandler will pass information on to.
|
|
|
|
The next textHandler in the chain.
|