|
Public Member Functions |
| | OffsetAnnotationAnnotator (Conflater *p_conflater) |
| | OffsetAnnotationAnnotator () |
| | ~OffsetAnnotationAnnotator () |
| void | setTags (const char *docno, const std::vector< indri::parse::TagExtent * > &tagset) |
| void | setConflater (Conflater *p_conflater) |
| void | setHandler (ObjectHandler< indri::api::ParsedDocument > &handler) |
| void | handle (indri::api::ParsedDocument *document) |
| void | setHint (indri::parse::OffsetAnnotationIndexHint hintType) |
| void | open (const std::string &offsetAnnotationsFile) |
| indri::api::ParsedDocument * | transform (indri::api::ParsedDocument *document) |
Private Member Functions |
| const char * | _getDocno (indri::api::ParsedDocument *document) |
| TagExtent * | _getTag (UINT64 id) |
| AttributeValuePair * | _getAttribute (UINT64 id) |
| bool | _is_unique_id (UINT64 id, int line) |
| UINT64 | parse_UINT64 (const char *str, int n) |
| void | _cleanup () |
| ReadAnnotationTag | parseLine (char *readLine, int lineCounter) |
| void | readAnnotationTags (const char *docno) |
| void | convert_annotations (std::set< indri::parse::TagExtent * > *raw_tags, std::set< indri::parse::TagExtent * > *converted_tags, indri::api::ParsedDocument *document) |
Private Attributes |
| OffsetAnnotationIndexHint | _indexHintType |
| std::string | _offsetAnnotationsFile |
| int | lastBufferAllocationSize |
| indri::utility::HashTable< const char *, std::set< TagExtent * > * > * | _annotations |
| indri::utility::HashTable< const char *, std::set< TagExtent * > * > * | _converted_annotations |
| indri::utility::HashTable< UINT64, TagExtent * > * | _tag_id_map |
| indri::utility::HashTable< UINT64, AttributeValuePair * > * | _attribute_id_map |
| std::vector< char * > * | _buffers_allocated |
| bool | _first_open |
| ObjectHandler< indri::api::ParsedDocument > * | _handler |
| Conflater * | _p_conflater |
| std::ifstream | annotationFile |
| int | offsetAnnotationFileLine |
| ReadAnnotationTag | lastReadTag |