#include "indri/DocumentIteratorFactory.hpp"
#include "indri/PDFDocumentExtractor.hpp"
#include "indri/TaggedDocumentIterator.hpp"
#include "indri/WARCDocumentIterator.hpp"
#include "indri/TextDocumentExtractor.hpp"
#include "indri/MboxDocumentIterator.hpp"
#include <iostream>
#include <locale>
#include "Exception.hpp"
Defines
#define TYPE_TAGGED ( "Tagged Document Collection" )
#define TYPE_WARC ( "WARC Document Collection" )
#define TYPE_PDF ( "Adobe PDF" )
#define TYPE_WORD ( "Microsoft Word" )
#define TYPE_PPT ( "Microsoft PowerPoint" )
#define TYPE_MBOX ( "Mailbox" )
#define TYPE_TEXT ( "Text" )
|
|
|
|
|
|
|
|
|
|
|
|
|
|