#include <InvPushIndex.hpp>
Inheritance diagram for InvPushIndex:

Public Methods | |
| InvPushIndex (char *prefix="DefaultIndex",int cachesize=128000000,long maxfilesize=2100000000,DOCID_T startdocid=1) | |
| ~InvPushIndex () | |
| void | setName (char *prefix) |
| Sets the name for this index; the name is used as the prefix for all files related to this index. | |
| bool | beginDoc (DocumentProps *dp) |
| the beginning of a new document, returns true if initiation was successful. | |
| bool | addTerm (Term &t) |
| adding a term to the current document, returns true if term was added successfully. | |
| void | endDoc (DocumentProps *dp) |
| signify the end of current document. | |
| virtual void | endDoc (DocumentProps *dp,const char *mgr) |
| Signify the end of the current document and associate it with the given document manager. This does not change the document manager previously set with setDocManager. | |
| void | endCollection (CollectionProps *cp) |
| signify the end of this collection. properties passed at the beginning of a collection should be handled by the constructor. | |
| void | setDocManager (const char *mgrID) |
| set the document manager to use for succeeding documents. | |
Protected Methods | |
| void | writeTOC (int numinv) |
| void | writeDocIDs () |
| void | writeCache () |
| void | lastWriteCache () |
| void | writeDTIDs () |
| void | writeDocMgrIDs () |
| int | docMgrID (const char *mgr) |
| Returns the internal id of the given docmgr. If the docmgr is not already registered, it will be added. | |
| virtual void | doendDoc (DocumentProps *dp,int mgrid) |
Protected Attributes | |
| long | maxfile |
| MemCache* | cache |
| the maximum size our file can be. | |
| vector<char*> | docIDs |
| the main memory handler for building. | |
| vector<char*> | termIDs |
| list of external docids in internal docid order. | |
| vector<char*> | tempfiles |
| list of terms in termid order. | |
| vector<char*> | dtfiles |
| list of tempfiles we've written to flush cache. | |
| vector<char*> | docmgrs |
| list of dt index files. | |
| FILE* | writetlookup |
| ofstream | writetlist |
| filestream for writing the lookup table to the docterm db. | |
| int | tcount |
| filestream for writing the list of located terms for each document. | |
| int | tidcount |
| count of total terms. | |
| int | dtidcount |
| count of unique terms. | |
| char* | name |
| count of unique terms in a current doc. | |
| int | namelen |
| the prefix name. | |
| TABLE_T | wordtable |
| the length of the name (avoid many calls to strlen). | |
| map<int, int> | termlist |
| table of all terms and their doclists. | |
| int* | membuf |
| maps of terms and freqs. | |
| int | membufsize |
| memory to use for cache and buffers. | |
| int | curdocmgr |
|
|
|
|
|
|
|
|
adding a term to the current document, returns true if term was added successfully.
Reimplemented from PushIndex. Reimplemented in InvFPPushIndex. |
|
|
the beginning of a new document, returns true if initiation was successful.
Reimplemented from PushIndex. |
|
|
Returns the internal id of the given docmgr. If the docmgr is not already registered, it will be added.
|
|
|
Reimplemented in InvFPPushIndex. |
|
|
signify the end of this collection. properties passed at the beginning of a collection should be handled by the constructor.
Reimplemented from PushIndex. Reimplemented in InvFPPushIndex. |
|
|
Signify the end of the current document and associate it with the given document manager. This does not change the document manager previously set with setDocManager.
|
|
|
signify the end of current document.
Reimplemented from PushIndex. |
|
|
|
|
|
set the document manager to use for succeeding documents.
Reimplemented from PushIndex. |
|
|
Sets the name for this index; the name is used as the prefix for all files related to this index.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Reimplemented in InvFPPushIndex. |
|
|
the maximum size our file can be.
|
|
|
|
|
|
the main memory handler for building.
|
|
|
list of dt index files.
|
|
|
list of tempfiles we've written to flush cache.
|
|
|
count of unique terms.
|
|
|
|
|
|
maps of terms and freqs.
|
|
|
memory to use for cache and buffers.
|
|
|
count of unique terms in a current doc.
|
|
|
the prefix name.
|
|
|
filestream for writing the list of located terms for each document.
|
|
|
list of terms in termid order.
|
|
|
list of external docids in internal docid order.
|
|
|
table of all terms and their doclists.
Reimplemented in InvFPPushIndex. |
|
|
count of total terms.
|
|
|
the length of the name (avoid many calls to strlen).
|
|
|
filestream for writing the lookup table to the docterm db.
|
|
|
|
1.2.4 written by Dimitri van Heesch,
© 1997-2000