#include <InvIndex.hpp>
Inheritance diagram for InvIndex:
Public Methods | |
InvIndex () | |
InvIndex (const string &indexName) | |
~InvIndex () | |
void | setMesgStream (ostream *lemStream) |
Set the message stream. | |
Open index | |
bool | open (const string &indexName) |
Open previously created Index with given prefix, return true if opened successfully. | |
Spelling and index conversion | |
TERMID_T | term (const TERM_T &word) const |
Convert a term spelling to a termID. | |
const TERM_T | term (TERMID_T termID) const |
Convert a termID to its spelling. | |
DOCID_T | document (const EXDOCID_T &docIDStr) const |
Convert a spelling to docID. | |
const EXDOCID_T | document (DOCID_T docID) const |
Convert a docID to its spelling. | |
const DocumentManager * | docManager (DOCID_T docID) const |
Summary counts | |
COUNT_T | docCount () const |
Total count (i.e., number) of documents in collection. | |
COUNT_T | termCountUnique () const |
Total count of unique terms in collection. | |
COUNT_T | termCount (TERMID_T termID) const |
Total counts of a term in collection. | |
COUNT_T | termCount () const |
Total counts of all terms in collection. | |
float | docLengthAvg () const |
Average document length. | |
COUNT_T | docCount (TERMID_T termID) const |
Total count of documents containing a given term. | |
COUNT_T | docLength (DOCID_T docID) const |
Total counts of terms in a document, including stop words. | |
virtual COUNT_T | docLengthCounted (DOCID_T docID) const |
Total count of terms in given document, not including stop words. | |
Index entry access | |
DocInfoList * | docInfoList (TERMID_T termID) const |
Document entries in a term index.
| |
TermInfoList * | termInfoList (DOCID_T docID) const |
Word entries in a document index (bag of words).
| |
Protected Methods | |
bool | fullToc (const string &fileName) |
read in the full table of contents (toc) | |
bool | indexLookup () |
read in index lookup table | |
bool | invFileIDs () |
read in inverted index filenames map | |
bool | docMgrIDs () |
read in document manager internal and external ids map | |
bool | dtLookup () |
read in dt index lookup table of format ver1.9 (and up?) | |
bool | dtLookup_ver1 () |
read in dt index lookup table of format older than ver1.9 | |
bool | dtFileIDs () |
read in dt index filenames map | |
bool | termIDs () |
read in termIDs to term spelling map | |
bool | docIDs () |
read in docIDs to doc spelling map | |
Protected Attributes | |
LOC_T * | counts |
string * | names |
float | aveDocLen |
inv_entry * | lookup |
dt_entry * | dtlookup |
int | dtloaded |
TERM_T * | terms |
EXDOCID_T * | docnames |
string * | dtfiles |
ifstream * | dtfstreams |
string * | invfiles |
ifstream * | invfstreams |
vector< DocumentManager * > | docmgrs |
map< TERM_T, TERMID_T, less< TERM_T > > | termtable |
map< EXDOCID_T, DOCID_T, less< EXDOCID_T > > | doctable |
ostream * | msgstream |
|
|
|
|
|
|
|
Total count of documents containing a given term.
Implements Index. |
|
Total count (i.e., number) of documents in collection.
Implements Index. |
|
read in docIDs to doc spelling map
|
|
Document entries in a term index.
Implements Index. Reimplemented in InvFPIndex. |
|
Total counts of terms in a document, including stop words.
Implements Index. |
|
Average document length.
Implements Index. |
|
Total count of terms in given document, not including stop words.
Reimplemented in InvFPIndex. |
|
A string identifier for the document manager to get at the source of the document with this document ID. Reimplemented from Index. |
|
read in document manager internal and external ids map
|
|
Convert a docID to its spelling.
Implements Index. |
|
Convert a spelling to docID.
Implements Index. |
|
read in dt index filenames map
|
|
read in dt index lookup table of format ver1.9 (and up?)
|
|
read in dt index lookup table of format older than ver1.9
|
|
read in the full table of contents (toc)
|
|
read in index lookup table
|
|
read in inverted index filenames map
|
|
Open previously created Index with given prefix, return true if opened successfully.
Implements Index. |
|
Set the message stream.
|
|
Convert a termID to its spelling.
Implements Index. |
|
Convert a term spelling to a termID.
Implements Index. |
|
Total counts of all terms in collection.
Implements Index. |
|
Total counts of a term in collection.
Implements Index. |
|
Total count of unique terms in collection.
Implements Index. |
|
read in termIDs to term spelling map
|
|
Word entries in a document index (bag of words).
Implements Index. Reimplemented in InvFPIndex. |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|