#include <RawTextParser.hpp>
Public Member Functions | |
| RawTextParser (int memorySize=1024 *1024) | |
| ~RawTextParser () | |
| bool | open (const std::string &fileName) | 
| void | close () | 
| bool | parseDocument (std::string &docName, indri::utility::greedy_vector< char * > &words) | 
Private Attributes | |
| std::ifstream | _in | 
| char * | _buffer | 
| char * | _current | 
| int | _bufferSize | 
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  ||||||||||||
| 
 Parses the next document in the file stream, returning a list of char* pointers to words. The words are stored in a character buffer within the parser, which means that if you call parseDocument again, all your old word pointers are invalid.  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
      
  | 
  
| 
 
  | 
  
 
1.3.4