#include <RawTextParser.hpp>
Public Member Functions | |
| RawTextParser (int memorySize=1024 *1024) | |
| ~RawTextParser () | |
| bool | open (const std::string &fileName) |
| void | close () |
| bool | parseDocument (std::string &docName, indri::utility::greedy_vector< char * > &words) |
Private Attributes | |
| std::ifstream | _in |
| char * | _buffer |
| char * | _current |
| int | _bufferSize |
|
|
|
|
|
|
|
|
|
|
|
|
|
||||||||||||
|
Parses the next document in the file stream, returning a list of char* pointers to its words. The words are stored in a character buffer within the parser, which means that if you call parseDocument again, all of your old word pointers become invalid. |
|
|
|
|
|
|
|
|
|
|
|
|
1.3.4