|
Public Member Functions |
| | IndexEnvironment () |
| | ~IndexEnvironment () |
| void | setOffsetAnnotationsPath (const std::string &offsetAnnotationsRoot) |
| void | setOffsetMetadataPath (const std::string &offsetMetadataRoot) |
| void | setAnchorTextPath (const std::string &anchorTextRoot) |
| void | setDocumentRoot (const std::string &documentRoot) |
| void | addFileClass (const std::string &name, const std::string &iterator, const std::string &parser, const std::string &tokenizer, const std::string &startDocTag, const std::string &endDocTag, const std::string &endMetadataTag, const std::vector< std::string > &include, const std::vector< std::string > &exclude, const std::vector< std::string > &index, const std::vector< std::string > &metadata, const std::map< indri::parse::ConflationPattern *, std::string > &conflations) |
| indri::parse::FileClassEnvironmentFactory::Specification * | getFileClassSpec (const std::string &name) |
| void | addFileClass (const indri::parse::FileClassEnvironmentFactory::Specification &spec) |
| void | setIndexedFields (const std::vector< std::string > &fieldNames) |
| void | setNumericField (const std::string &fieldName, bool isNumeric, const std::string &parserName="") |
| void | setOrdinalField (const std::string &fieldName, bool isOrdinal) |
| void | setParentalField (const std::string &fieldName, bool isParental) |
| void | setMetadataIndexedFields (const std::vector< std::string > &forwardFieldNames, const std::vector< std::string > &backwardFieldNames) |
| void | setStopwords (const std::vector< std::string > &stopwords) |
| void | setStemmer (const std::string &stemmer) |
| void | setMemory (UINT64 memory) |
| void | setNormalization (bool flag) |
| void | setStoreDocs (bool flag) |
| void | setOffsetAnnotationIndexHint (indri::parse::OffsetAnnotationIndexHint hintType) |
| void | create (const std::string &repositoryPath, IndexStatus *callback=0) |
| void | open (const std::string &repositoryPath, IndexStatus *callback=0) |
| void | close () |
| | Closes the index and repository.
|
| void | addFile (const std::string &fileName) |
| void | addFile (const std::string &fileName, const std::string &fileClass) |
| lemur::api::DOCID_T | addString (const std::string &documentString, const std::string &fileClass, const std::vector< indri::parse::MetadataPair > &metadata) |
| lemur::api::DOCID_T | addString (const std::string &documentString, const std::string &fileClass, const std::vector< indri::parse::MetadataPair > &metadata, const std::vector< indri::parse::TagExtent * > &tags) |
| lemur::api::DOCID_T | addParsedDocument (ParsedDocument *document) |
| void | deleteDocument (lemur::api::DOCID_T documentID) |
| int | documentsIndexed () |
| | Returns the number of documents indexed so far in this session.
|
| int | documentsSeen () |
| void | compact () |
Static Public Member Functions |
| void | merge (const std::string &outputIndex, const std::vector< std::string > &inputIndexes) |
Private Member Functions |
| void | _getParsingContext (indri::parse::Parser **parser, indri::parse::Tokenizer **tokenizer, indri::parse::DocumentIterator **iterator, indri::parse::Conflater **conflater, const std::string &extension) |
| std::vector< indri::parse::Transformation * > | _createAnnotators (const std::string &fileName, const std::string &fileClass, indri::parse::Conflater **conflater) |
| ParsedDocument * | _applyAnnotators (std::vector< indri::parse::Transformation * > &annotators, ParsedDocument *parsed) |
Private Attributes |
| IndexStatus * | _callback |
| Parameters * | _options |
| std::string | _repositoryPath |
| indri::collection::Repository | _repository |
| int | _documents |
| std::string | _error |
| std::string | _offsetAnnotationsRoot |
| std::string | _offsetMetadataRoot |
| std::string | _anchorTextRoot |
| std::string | _documentRoot |
| Parameters | _parameters |
| indri::parse::FileClassEnvironmentFactory | _fileClassFactory |
| indri::parse::AnchorTextAnnotator | _annotator |
| indri::parse::OffsetAnnotationAnnotator | _oa_annotator |
| indri::parse::OffsetMetadataAnnotator | _om_annotator |
| std::map< std::string, indri::parse::FileClassEnvironment * > | _environments |
| int | _documentsIndexed |
| int | _documentsSeen |
Friends |
| class | QueryEnvironment |