#include <TextHandler.hpp>
Inheritance diagram for TextHandler:

Public Types | |
| enum | TokenType { BEGINDOC = 1, ENDDOC = 2, WORD = 3, BEGINTAG = 4, ENDTAG = 5, SYMBOL = 6 } |
Public Methods | |
| TextHandler () | |
| virtual | ~TextHandler () |
| virtual void | setTextHandler (TextHandler *th) |
| Set the TextHandler that this TextHandler will pass information on to. | |
| virtual TextHandler * | getTextHandler () |
| Get the TextHandler that this TextHandler will pass information on to. | |
| virtual void | foundToken (int type, char *token=NULL, char *orig=NULL, PropertyList *properties=NULL) |
| virtual char * | handleBeginDoc (char *docno, char *original, PropertyList *list) |
| virtual char * | handleEndDoc (char *token, char *original, PropertyList *list) |
| virtual char * | handleWord (char *word, char *original, PropertyList *list) |
| virtual char * | handleBeginTag (char *tag, char *original, PropertyList *list) |
| Handle a begin tag. | |
| virtual char * | handleEndTag (char *tag, char *original, PropertyList *list) |
| Handle an end tag. | |
| virtual char * | handleSymbol (char *symbol, char *original, PropertyList *list) |
| virtual void | foundDoc (char *docno) |
| Found a document with document number. | |
| virtual void | foundDoc (char *docno, char *original) |
| virtual void | foundWord (char *word) |
| Found a word. | |
| virtual void | foundWord (char *word, char *original) |
| virtual void | foundEndDoc () |
| Found end of doc. | |
| virtual void | foundSymbol (char *sym) |
| Found a symbol. | |
| virtual char * | handleDoc (char *docno) |
| Handle a doc. | |
| virtual char * | handleWord (char *word) |
| Handle a word, possibly transforming it. | |
| virtual void | handleEndDoc () |
| Handle the end of the doc. | |
| virtual char * | handleSymbol (char *sym) |
| Handle a symbol, possibly transforming it. | |
Protected Attributes | |
| TextHandler * | textHandler |
| The next textHandler in the chain. | |
| char | buffer [MAXWORDSIZE] |
|
|
|
|
|
|
|
|
|
|
||||||||||||
|
|
|
|
Found a document with document number.
|
|
|
Found end of doc.
|
|
|
Found a symbol.
|
|
||||||||||||||||||||
|
|
|
||||||||||||
|
|
|
|
Found a word.
|
|
|
Get the TextHandler that this TextHandler will pass information on to.
|
|
||||||||||||||||
|
Handle the beginning of a doc - the default implementation calls handleDoc for backward compatibility. |
|
||||||||||||||||
|
Handle a begin tag.
|
|
|
Handle a doc.
Reimplemented in DocFreqIndexer, FreqCounter, InvFPTextHandler, PropIndexTH, FlattextDocMgr, WriterInQueryHandler, and WriterTextHandler. |
|
|
Handle the end of the doc.
Reimplemented in DocFreqIndexer. |
|
||||||||||||||||
|
Handle the end of a doc - the default implementation calls the old handleEndDoc for backward compatibility. |
|
||||||||||||||||
|
Handle an end tag.
|
|
|
Handle a symbol, possibly transforming it.
Reimplemented in WriterInQueryHandler. |
|
||||||||||||||||
|
Handle a symbol - the default implementation calls the old handleSymbol for backward compatibility. |
|
|
Handle a word, possibly transforming it.
Reimplemented in CtfIndexer, DocFreqIndexer, FreqCounter, InvFPTextHandler, QueryTextHandler, Stemmer, Stopper, WriterInQueryHandler, and WriterTextHandler. |
|
||||||||||||||||
|
Handle a word - the default implementation calls the old handleWord for backward compatibility. Reimplemented in PropIndexTH and BrillPOSTokenizer. |
|
|
Set the TextHandler that this TextHandler will pass information on to.
|
|
|
|
|
|
The next textHandler in the chain.
|
1.2.18