#include <stdio.h>
#include <string.h>
#include <errno.h>
#include <stdlib.h>
#include <ctype.h>
#include "indri/TextTokenizer.hpp"
#include "indri/TermExtent.hpp"
#include "indri/TagEvent.hpp"
#include "indri/TokenizedDocument.hpp"
#include "indri/UnparsedDocument.hpp"
#include "indri/UTF8Transcoder.hpp"
#include "indri/AttributeValuePair.hpp"
Classes | |
struct | yy_buffer_state |
struct | yy_trans_info |
Defines | |
#define | YY_INT_ALIGNED short int |
#define | FLEX_SCANNER |
#define | YY_FLEX_MAJOR_VERSION 2 |
#define | YY_FLEX_MINOR_VERSION 5 |
#define | YY_FLEX_SUBMINOR_VERSION 33 |
#define | FLEX_BETA |
#define | INT8_MIN (-128) |
#define | INT16_MIN (-32767-1) |
#define | INT32_MIN (-2147483647-1) |
#define | INT8_MAX (127) |
#define | INT16_MAX (32767) |
#define | INT32_MAX (2147483647) |
#define | UINT8_MAX (255U) |
#define | UINT16_MAX (65535U) |
#define | UINT32_MAX (4294967295U) |
#define | yyconst |
#define | YY_NULL 0 |
#define | YY_SC_TO_UI(c) ((unsigned int) (unsigned char) c) |
#define | BEGIN (yy_start) = 1 + 2 * |
#define | YY_START (((yy_start) - 1) / 2) |
#define | YYSTATE YY_START |
#define | YY_STATE_EOF(state) (YY_END_OF_BUFFER + state + 1) |
#define | YY_NEW_FILE tokrestart(tokin ) |
#define | YY_END_OF_BUFFER_CHAR 0 |
#define | YY_BUF_SIZE 16384 |
#define | YY_STATE_BUF_SIZE ((YY_BUF_SIZE + 2) * sizeof(yy_state_type)) |
#define | EOB_ACT_CONTINUE_SCAN 0 |
#define | EOB_ACT_END_OF_FILE 1 |
#define | EOB_ACT_LAST_MATCH 2 |
#define | YY_LESS_LINENO(n) |
#define | yyless(n) |
#define | unput(c) yyunput( c, (yytext_ptr) ) |
#define | YY_BUFFER_NEW 0 |
#define | YY_BUFFER_NORMAL 1 |
#define | YY_BUFFER_EOF_PENDING 2 |
#define | YY_CURRENT_BUFFER |
#define | YY_CURRENT_BUFFER_LVALUE (yy_buffer_stack)[(yy_buffer_stack_top)] |
#define | YY_FLUSH_BUFFER tok_flush_buffer(YY_CURRENT_BUFFER ) |
#define | yy_new_buffer tok_create_buffer |
#define | yy_set_interactive(is_interactive) |
#define | yy_set_bol(at_bol) |
#define | YY_AT_BOL() (YY_CURRENT_BUFFER_LVALUE->yy_at_bol) |
#define | tokwrap(n) 1 |
#define | YY_SKIP_YYWRAP |
#define | yytext_ptr toktext |
#define | YY_DO_BEFORE_ACTION |
#define | YY_NUM_RULES 14 |
#define | YY_END_OF_BUFFER 15 |
#define | REJECT reject_used_but_not_detected |
#define | yymore() yymore_used_but_not_detected |
#define | YY_MORE_ADJ 0 |
#define | YY_RESTORE_YY_MORE_OFFSET |
#define | ZAP 1 |
#define | TAG 2 |
#define | ASCII_TOKEN 3 |
#define | UTF8_TOKEN 4 |
#define | INITIAL 0 |
#define | COMMENT 1 |
#define | YY_EXTRA_TYPE void * |
#define | YY_READ_BUF_SIZE 8192 |
#define | ECHO (void) fwrite( toktext, tokleng, 1, tokout ) |
#define | YY_INPUT(buf, result, max_size) |
#define | yyterminate() return YY_NULL |
#define | YY_START_STACK_INCR 25 |
#define | YY_FATAL_ERROR(msg) yy_fatal_error( msg ) |
#define | YY_DECL_IS_OURS 1 |
#define | YY_DECL int toklex (void) |
#define | YY_BREAK break; |
#define | YY_RULE_SETUP YY_USER_ACTION |
#define | YY_EXIT_FAILURE 2 |
#define | yyless(n) |
#define | YYTABLES_NAME "yytables" |
Typedefs | |
typedef signed char | flex_int8_t |
typedef short int | flex_int16_t |
typedef int | flex_int32_t |
typedef unsigned char | flex_uint8_t |
typedef unsigned short int | flex_uint16_t |
typedef unsigned int | flex_uint32_t |
typedef yy_buffer_state * | YY_BUFFER_STATE |
typedef unsigned int | yy_size_t |
typedef unsigned char | YY_CHAR |
typedef int | yy_state_type |
Functions | |
void | tokrestart (FILE *input_file) |
void | tok_switch_to_buffer (YY_BUFFER_STATE new_buffer) |
YY_BUFFER_STATE | tok_create_buffer (FILE *file, int size) |
void | tok_delete_buffer (YY_BUFFER_STATE b) |
void | tok_flush_buffer (YY_BUFFER_STATE b) |
void | tokpush_buffer_state (YY_BUFFER_STATE new_buffer) |
void | tokpop_buffer_state (void) |
void | tokensure_buffer_stack (void) |
void | tok_load_buffer_state (void) |
void | tok_init_buffer (YY_BUFFER_STATE b, FILE *file) |
YY_BUFFER_STATE | tok_scan_buffer (char *base, yy_size_t size) |
YY_BUFFER_STATE | tok_scan_string (yyconst char *yy_str) |
YY_BUFFER_STATE | tok_scan_bytes (yyconst char *bytes, int len) |
void * | tokalloc (yy_size_t) |
void * | tokrealloc (void *, yy_size_t) |
void | tokfree (void *) |
yy_state_type | yy_get_previous_state (void) |
yy_state_type | yy_try_NUL_trans (yy_state_type current_state) |
int | yy_get_next_buffer (void) |
void | yy_fatal_error (yyconst char msg[]) |
int | yy_init_globals (void) |
void | yyunput (int c, char *buf_ptr) |
int | input (void) |
int | toklex (void) |
Variables | |
int | tokleng |
FILE * | tokin = (FILE *) 0 *tokout = (FILE *) 0 |
FILE * | tokout |
size_t | yy_buffer_stack_top = 0 |
size_t | yy_buffer_stack_max = 0 |
YY_BUFFER_STATE * | yy_buffer_stack = 0 |
char | yy_hold_char |
int | yy_n_chars |
char * | yy_c_buf_p = (char *) 0 |
int | yy_init = 0 |
int | yy_start = 0 |
int | yy_did_buffer_switch_on_eof |
int | toklineno = 1 |
char * | toktext |
yyconst flex_int16_t | yy_nxt [][256] |
yyconst flex_int16_t | yy_accept [68] |
yy_state_type | yy_last_accepting_state |
char * | yy_last_accepting_cpos |
yyconst yy_state_type | yy_NUL_trans [68] |
int | tok_flex_debug = 0 |
long | byte_position |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Value: ( (yy_buffer_stack) \ ? (yy_buffer_stack)[(yy_buffer_stack_top)] \ : NULL) |
|
|
|
|
|
|
|
Value: (yytext_ptr) = yy_bp; \ tokleng = (size_t) (yy_cp - yy_bp); \ (yy_hold_char) = *yy_cp; \ *yy_cp = '\0'; \ (yy_c_buf_p) = yy_cp; |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Value: if ( YY_CURRENT_BUFFER_LVALUE->yy_is_interactive ) \ { \ int c = '*'; \ size_t n; \ for ( n = 0; n < max_size && \ (c = getc( tokin )) != EOF && c != '\n'; ++n ) \ buf[n] = (char) c; \ if ( c == '\n' ) \ buf[n++] = (char) c; \ if ( c == EOF && ferror( tokin ) ) \ YY_FATAL_ERROR( "input in flex scanner failed" ); \ result = n; \ } \ else \ { \ errno=0; \ while ( (result = fread(buf, 1, max_size, tokin))==0 && ferror(tokin)) \ { \ if( errno != EINTR) \ { \ YY_FATAL_ERROR( "input in flex scanner failed" ); \ break; \ } \ errno=0; \ clearerr(tokin); \ } \ }\ \ |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Value: { \ if ( ! YY_CURRENT_BUFFER ){\ tokensure_buffer_stack (); \ YY_CURRENT_BUFFER_LVALUE = \ tok_create_buffer(tokin,YY_BUF_SIZE ); \ } \ YY_CURRENT_BUFFER_LVALUE->yy_at_bol = at_bol; \ } |
|
Value: { \ if ( ! YY_CURRENT_BUFFER ){ \ tokensure_buffer_stack (); \ YY_CURRENT_BUFFER_LVALUE = \ tok_create_buffer(tokin,YY_BUF_SIZE ); \ } \ YY_CURRENT_BUFFER_LVALUE->yy_is_interactive = is_interactive; \ } |
|
|
|
|
|
|
|
|
|
|
|
|
|
Value: do \ { \ \ int yyless_macro_arg = (n); \ YY_LESS_LINENO(yyless_macro_arg);\ toktext[tokleng] = (yy_hold_char); \ (yy_c_buf_p) = toktext + yyless_macro_arg; \ (yy_hold_char) = *(yy_c_buf_p); \ *(yy_c_buf_p) = '\0'; \ tokleng = yyless_macro_arg; \ } \ while ( 0 ) |
|
Value: do \ { \ \ int yyless_macro_arg = (n); \ YY_LESS_LINENO(yyless_macro_arg);\ *yy_cp = (yy_hold_char); \ YY_RESTORE_YY_MORE_OFFSET \ (yy_c_buf_p) = yy_cp = yy_bp + yyless_macro_arg - YY_MORE_ADJ; \ YY_DO_BEFORE_ACTION; \ } \ while ( 0 ) |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Initial value: { 0, 0, 0, 0, 0, 15, 13, 12, 13, 9, 13, 9, 13, 9, 11, 2, 2, 2, 2, 4, 2, 2, 2, 2, 0, 0, 9, 10, 8, 9, 11, 0, 0, 2, 2, 2, 2, 0, 2, 2, 2, 2, 2, 0, 0, 7, 0, 0, 0, 0, 5, 0, 6, 2, 2, 2, 3, 2, 2, 2, 2, 2, 0, 10, 8, 1, 2, 2 } |
|
Stack as an array. |
|
capacity of stack. |
|
index of top of stack. |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Initial value: { 0, 6, 6, 15, 15, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 33, 33, 33, 33, 0, 33, 33, 33, 33, 0, 0, 0, 0, 0, 0, 0, 48, 51, 33, 33, 33, 33, 0, 33, 33, 33, 58, 60, 0, 0, 0, 0, 0, 48, 48, 0, 51, 0, 33, 33, 33, 0, 33, 58, 33, 60, 33, 0, 0, 0, 48, 33, 33 } |
|
|
|
|