#include <HTMLParser.hpp>
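Inheritance diagram for indri::parse::HTMLParser: [diagram image not included in this text version; the "Reimplemented from" notes below show that indri::parse::TaggedTextParser is among its base classes]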

Public Member Functions
- HTMLParser ()
- ~HTMLParser ()
Protected Member Functions
- virtual void initialize (TokenizedDocument *tokenized, indri::api::ParsedDocument *parsed)
- virtual void cleanup (TokenizedDocument *tokenized, indri::api::ParsedDocument *parsed)
- virtual void handleTag (TagEvent *te)
- void prepURL (char *s)
- bool normalizeURL (char *s)
Protected Attributes
- char url [MAX_URL_LENGTH]
- char base_url [MAX_URL_LENGTH]
- tag_properties * _relativeUrlTag
- tag_properties * _absoluteUrlTag
- tag_properties * _anchorTag
- indri::utility::Buffer _urlBuffer
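[Detailed member documentation: the member names and descriptions were lost when this page was converted to text. Three entries survive, each recording only that the member overrides one in indri::parse::TaggedTextParser. These presumably correspond to the three virtual functions listed above (initialize, cleanup, handleTag); confirm against the original HTML page.]

Reimplemented from indri::parse::TaggedTextParser.

Reimplemented from indri::parse::TaggedTextParser.

Reimplemented from indri::parse::TaggedTextParser.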
1.3.4