|
Public Member Functions |
| IndexEnvironment () |
| ~IndexEnvironment () |
void | setOffsetAnnotationsPath (const std::string &offsetAnnotationsRoot) |
void | setOffsetMetadataPath (const std::string &offsetMetadataRoot) |
void | setAnchorTextPath (const std::string &anchorTextRoot) |
void | setDocumentRoot (const std::string &documentRoot) |
void | addFileClass (const std::string &name, const std::string &iterator, const std::string &parser, const std::string &tokenizer, const std::string &startDocTag, const std::string &endDocTag, const std::string &endMetadataTag, const std::vector< std::string > &include, const std::vector< std::string > &exclude, const std::vector< std::string > &index, const std::vector< std::string > &metadata, const std::map< indri::parse::ConflationPattern *, std::string > &conflations) |
indri::parse::FileClassEnvironmentFactory::Specification * | getFileClassSpec (const std::string &name) |
void | addFileClass (const indri::parse::FileClassEnvironmentFactory::Specification &spec) |
void | setIndexedFields (const std::vector< std::string > &fieldNames) |
void | setNumericField (const std::string &fieldName, bool isNumeric, const std::string &parserName="") |
void | setOrdinalField (const std::string &fieldName, bool isOrdinal) |
void | setParentalField (const std::string &fieldName, bool isParental) |
void | setMetadataIndexedFields (const std::vector< std::string > &forwardFieldNames, const std::vector< std::string > &backwardFieldNames) |
void | setStopwords (const std::vector< std::string > &stopwords) |
void | setStemmer (const std::string &stemmer) |
void | setMemory (UINT64 memory) |
void | setNormalization (bool flag) |
void | setStoreDocs (bool flag) |
void | setOffsetAnnotationIndexHint (indri::parse::OffsetAnnotationIndexHint hintType) |
void | create (const std::string &repositoryPath, IndexStatus *callback=0) |
void | open (const std::string &repositoryPath, IndexStatus *callback=0) |
void | close () |
| Closes the index and repository.
|
void | addFile (const std::string &fileName) |
void | addFile (const std::string &fileName, const std::string &fileClass) |
lemur::api::DOCID_T | addString (const std::string &documentString, const std::string &fileClass, const std::vector< indri::parse::MetadataPair > &metadata) |
lemur::api::DOCID_T | addString (const std::string &documentString, const std::string &fileClass, const std::vector< indri::parse::MetadataPair > &metadata, const std::vector< indri::parse::TagExtent * > &tags) |
lemur::api::DOCID_T | addParsedDocument (ParsedDocument *document) |
void | deleteDocument (lemur::api::DOCID_T documentID) |
int | documentsIndexed () |
| Returns the number of documents indexed so far in this session.
|
int | documentsSeen () |
void | compact () |
Static Public Member Functions |
void | merge (const std::string &outputIndex, const std::vector< std::string > &inputIndexes) |
Private Member Functions |
void | _getParsingContext (indri::parse::Parser **parser, indri::parse::Tokenizer **tokenizer, indri::parse::DocumentIterator **iterator, indri::parse::Conflater **conflater, const std::string &extension) |
std::vector< indri::parse::Transformation * > | _createAnnotators (const std::string &fileName, const std::string &fileClass, indri::parse::Conflater **conflater) |
ParsedDocument * | _applyAnnotators (std::vector< indri::parse::Transformation * > &annotators, ParsedDocument *parsed) |
Private Attributes |
IndexStatus * | _callback |
Parameters * | _options |
std::string | _repositoryPath |
indri::collection::Repository | _repository |
int | _documents |
std::string | _error |
std::string | _offsetAnnotationsRoot |
std::string | _offsetMetadataRoot |
std::string | _anchorTextRoot |
std::string | _documentRoot |
Parameters | _parameters |
indri::parse::FileClassEnvironmentFactory | _fileClassFactory |
indri::parse::AnchorTextAnnotator | _annotator |
indri::parse::OffsetAnnotationAnnotator | _oa_annotator |
indri::parse::OffsetMetadataAnnotator | _om_annotator |
std::map< std::string, indri::parse::FileClassEnvironment * > | _environments |
int | _documentsIndexed |
int | _documentsSeen |
Friends |
class | QueryEnvironment |