|
Public Member Functions |
| OffsetAnnotationAnnotator (Conflater *p_conflater) |
| OffsetAnnotationAnnotator () |
| ~OffsetAnnotationAnnotator () |
void | setTags (const char *docno, const std::vector< indri::parse::TagExtent * > &tagset) |
void | setConflater (Conflater *p_conflater) |
void | setHandler (ObjectHandler< indri::api::ParsedDocument > &handler) |
void | handle (indri::api::ParsedDocument *document) |
void | setHint (indri::parse::OffsetAnnotationIndexHint hintType) |
void | open (const std::string &offsetAnnotationsFile) |
indri::api::ParsedDocument * | transform (indri::api::ParsedDocument *document) |
Private Member Functions |
const char * | _getDocno (indri::api::ParsedDocument *document) |
TagExtent * | _getTag (UINT64 id) |
AttributeValuePair * | _getAttribute (UINT64 id) |
bool | _is_unique_id (UINT64 id, int line) |
UINT64 | parse_UINT64 (const char *str, int n) |
void | _cleanup () |
ReadAnnotationTag | parseLine (char *readLine, int lineCounter) |
void | readAnnotationTags (const char *docno) |
void | convert_annotations (std::set< indri::parse::TagExtent * > *raw_tags, std::set< indri::parse::TagExtent * > *converted_tags, indri::api::ParsedDocument *document) |
Private Attributes |
OffsetAnnotationIndexHint | _indexHintType |
std::string | _offsetAnnotationsFile |
int | lastBufferAllocationSize |
indri::utility::HashTable< const char *, std::set< TagExtent * > * > * | _annotations |
indri::utility::HashTable< const char *, std::set< TagExtent * > * > * | _converted_annotations |
indri::utility::HashTable< UINT64, TagExtent * > * | _tag_id_map |
indri::utility::HashTable< UINT64, AttributeValuePair * > * | _attribute_id_map |
std::vector< char * > * | _buffers_allocated |
bool | _first_open |
ObjectHandler< indri::api::ParsedDocument > * | _handler |
Conflater * | _p_conflater |
std::ifstream | annotationFile |
int | offsetAnnotationFileLine |
ReadAnnotationTag | lastReadTag |