#include <HTMLParser.hpp>
Inheritance diagram for indri::parse::HTMLParser:
Public Member Functions
HTMLParser ()
~HTMLParser ()
Protected Member Functions
virtual void initialize (TokenizedDocument *tokenized, indri::api::ParsedDocument *parsed)
virtual void cleanup (TokenizedDocument *tokenized, indri::api::ParsedDocument *parsed)
virtual void handleTag (TagEvent *te)
void prepURL (char *s)
bool normalizeURL (char *s)
Protected Attributes
char url [MAX_URL_LENGTH]
char base_url [MAX_URL_LENGTH]
tag_properties * _relativeUrlTag
tag_properties * _absoluteUrlTag
tag_properties * _anchorTag
indri::utility::Buffer _urlBuffer
|
|
|
|
|
The virtual member functions initialize, cleanup, and handleTag are each reimplemented from indri::parse::TaggedTextParser.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|