NetBSD/usr.bin/lex/main.c

1178 lines
28 KiB
C
Raw Normal View History

/* flex - tool to generate fast lexical analyzers */

/*-
 * Copyright (c) 1990 The Regents of the University of California.
 * All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Vern Paxson.
 *
 * The United States Government has rights in this work pursuant
 * to contract no. DE-AC03-76SF00098 between the United States
 * Department of Energy and the University of California.
 *
 * Redistribution and use in source and binary forms are permitted provided
 * that: (1) source distributions retain this entire copyright notice and
 * comment, and (2) distributions including binaries display the following
 * acknowledgement:  ``This product includes software developed by the
 * University of California, Berkeley and its contributors'' in the
 * documentation or other materials provided with the distribution and in
 * all advertising materials mentioning features or use of this software.
 * Neither the name of the University nor the names of its contributors may
 * be used to endorse or promote products derived from this software without
 * specific prior written permission.
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
 * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
 */
#ifndef lint
char copyright[] =
"@(#) Copyright (c) 1990 The Regents of the University of California.\n\
All rights reserved.\n";
#endif /* not lint */

/* $Header: /cvsroot/src/usr.bin/lex/Attic/main.c,v 1.9 1995/05/05 05:35:34 jtc Exp $ */

#include "flexdef.h"
#include "version.h"

static char flex_version[] = FLEX_VERSION;


/* declare functions that have forward references */

void flexinit PROTO((int, char**));
void readin PROTO((void));
void set_up_initial_allocations PROTO((void));

#ifdef NEED_ARGV_FIXUP
extern void argv_fixup PROTO((int *, char ***));
#endif


/* these globals are all defined and commented in flexdef.h */
int printstats, syntaxerror, eofseen, ddebug, trace, nowarn, spprdflt;
int interactive, caseins, lex_compat, do_yylineno, useecs, fulltbl, usemecs;
int fullspd, gen_line_dirs, performance_report, backing_up_report;
int C_plus_plus, long_align, use_read, yytext_is_array, do_yywrap, csize;
int yymore_used, reject, real_reject, continued_action, in_rule;
int yymore_really_used, reject_really_used;
int datapos, dataline, linenum, out_linenum;
FILE *skelfile = NULL;
int skel_ind = 0;
char *action_array;
int action_size, defs1_offset, prolog_offset, action_offset, action_index;
char *infilename = NULL, *outfilename = NULL;
int did_outfilename;
char *prefix, *yyclass;
int do_stdinit, use_stdout;
int onestate[ONE_STACK_SIZE], onesym[ONE_STACK_SIZE];
int onenext[ONE_STACK_SIZE], onedef[ONE_STACK_SIZE], onesp;
int current_mns, current_max_rules;
int num_rules, num_eof_rules, default_rule, lastnfa;
int *firstst, *lastst, *finalst, *transchar, *trans1, *trans2;
int *accptnum, *assoc_rule, *state_type;
int *rule_type, *rule_linenum, *rule_useful;
int current_state_type;
int variable_trailing_context_rules;
int numtemps, numprots, protprev[MSP], protnext[MSP], prottbl[MSP];
int protcomst[MSP], firstprot, lastprot, protsave[PROT_SAVE_SIZE];
int numecs, nextecm[CSIZE + 1], ecgroup[CSIZE + 1], nummecs, tecfwd[CSIZE + 1];
int tecbck[CSIZE + 1];
int lastsc, *scset, *scbol, *scxclu, *sceof;
int current_max_scs;
char **scname;
int current_max_dfa_size, current_max_xpairs;
int current_max_template_xpairs, current_max_dfas;
int lastdfa, *nxt, *chk, *tnxt;
int *base, *def, *nultrans, NUL_ec, tblend, firstfree, **dss, *dfasiz;
union dfaacc_union *dfaacc;
int *accsiz, *dhash, numas;
int numsnpairs, jambase, jamstate;
int lastccl, *cclmap, *ccllen, *cclng, cclreuse;
int current_maxccls, current_max_ccl_tbl_size;
Char *ccltbl;
char nmstr[MAXLINE];
int sectnum, nummt, hshcol, dfaeql, numeps, eps2, num_reallocs;
int tmpuses, totnst, peakpairs, numuniq, numdup, hshsave;
int num_backing_up, bol_needed;
FILE *backing_up_file;
int end_of_buffer_state;
char **input_files;
int num_input_files;

/* Make sure program_name is initialized so we don't crash if writing
 * out an error message before getting the program name from argv[0].
 */
char *program_name = "flex";

/* Format for the default output file name (filled in with the prefix and
 * the "c"/"cc" suffix) and the name of the backing-up report file.
 */
#ifndef SHORT_FILE_NAMES
static char *outfile_template = "lex.%s.%s";
static char *backing_name = "lex.backup";
#else
static char *outfile_template = "lex%s.%s";
static char *backing_name = "lex.bck";
#endif

#ifdef THINK_C
#include <console.h>
#endif

#ifdef MS_DOS
extern unsigned _stklen = 16384;
#endif

/* Buffer that receives the default output file name. */
static char outfile_path[MAXLINE];
/* Set to 1 once stdout has been redirected to the output file. */
static int outfile_created = 0;
/* Skeleton file named with -S, or NULL when none was given. */
static char *skelname = NULL;
int main( argc, argv )
int argc;
char **argv;
1993-12-02 22:17:24 +03:00
{
int i;
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
#ifdef THINK_C
argc = ccommand( &argv );
#endif
#ifdef NEED_ARGV_FIXUP
argv_fixup( &argc, &argv );
#endif
1993-12-02 22:17:24 +03:00
flexinit( argc, argv );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
readin();
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
ntod();
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
for ( i = 1; i <= num_rules; ++i )
if ( ! rule_useful[i] && i != default_rule )
1995-05-05 09:35:08 +04:00
line_warning( _( "rule cannot be matched" ),
1993-12-02 22:17:24 +03:00
rule_linenum[i] );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( spprdflt && ! reject && rule_useful[default_rule] )
1995-05-05 09:35:08 +04:00
line_warning(
_( "-s option given but default rule can be matched" ),
1993-12-02 22:17:24 +03:00
rule_linenum[default_rule] );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
/* Generate the C state transition tables from the DFA. */
make_tables();
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
/* Note, flexend does not return. It exits with its argument
* as status.
*/
flexend( 0 );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
return 0; /* keep compilers/lint happy */
}
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
/* check_options - check user-specified options */
void check_options()
{
int i;
if ( lex_compat )
{
if ( C_plus_plus )
flexerror( _( "Can't use -+ with -l option" ) );
if ( fulltbl || fullspd )
flexerror( _( "Can't use -f or -F with -l option" ) );
/* Don't rely on detecting use of yymore() and REJECT,
* just assume they'll be used.
*/
yymore_really_used = reject_really_used = true;
yytext_is_array = true;
do_yylineno = true;
use_read = false;
}
if ( do_yylineno )
/* This should really be "maintain_backup_tables = true" */
reject_really_used = true;
if ( csize == unspecified )
{
if ( (fulltbl || fullspd) && ! useecs )
csize = DEFAULT_CSIZE;
else
csize = CSIZE;
}
if ( interactive == unspecified )
{
if ( fulltbl || fullspd )
interactive = false;
else
interactive = true;
}
if ( fulltbl || fullspd )
{
if ( usemecs )
flexerror(
_( "-Cf/-CF and -Cm don't make sense together" ) );
if ( interactive )
flexerror( _( "-Cf/-CF and -I are incompatible" ) );
if ( lex_compat )
flexerror(
_( "-Cf/-CF are incompatible with lex-compatibility mode" ) );
if ( do_yylineno )
flexerror(
_( "-Cf/-CF and %option yylineno are incompatible" ) );
if ( fulltbl && fullspd )
flexerror( _( "-Cf and -CF are mutually exclusive" ) );
}
if ( C_plus_plus && fullspd )
flexerror( _( "Can't use -+ with -CF option" ) );
if ( C_plus_plus && yytext_is_array )
{
warn( _( "%array incompatible with -+ option" ) );
yytext_is_array = false;
}
if ( useecs )
{ /* Set up doubly-linked equivalence classes. */
/* We loop all the way up to csize, since ecgroup[csize] is
* the position used for NUL characters.
*/
ecgroup[1] = NIL;
for ( i = 2; i <= csize; ++i )
{
ecgroup[i] = i - 1;
nextecm[i - 1] = i;
}
nextecm[csize] = NIL;
}
else
{
/* Put everything in its own equivalence class. */
for ( i = 1; i <= csize; ++i )
{
ecgroup[i] = i;
nextecm[i] = BAD_SUBSCRIPT; /* to catch errors */
}
}
if ( ! use_stdout )
{
FILE *prev_stdout;
if ( ! did_outfilename )
{
char *suffix;
if ( C_plus_plus )
suffix = "cc";
else
suffix = "c";
sprintf( outfile_path, outfile_template,
prefix, suffix );
outfilename = outfile_path;
}
prev_stdout = freopen( outfilename, "w", stdout );
if ( prev_stdout == NULL )
lerrsf( _( "could not create %s" ), outfilename );
outfile_created = 1;
}
if ( skelname && (skelfile = fopen( skelname, "r" )) == NULL )
lerrsf( _( "can't open skeleton file %s" ), skelname );
if ( strcmp( prefix, "yy" ) )
{
#define GEN_PREFIX(name) out_str3( "#define yy%s %s%s\n", name, prefix, name )
if ( C_plus_plus )
GEN_PREFIX( "FlexLexer" );
else
{
GEN_PREFIX( "_create_buffer" );
GEN_PREFIX( "_delete_buffer" );
GEN_PREFIX( "_scan_buffer" );
GEN_PREFIX( "_scan_string" );
GEN_PREFIX( "_scan_bytes" );
GEN_PREFIX( "_flex_debug" );
GEN_PREFIX( "_init_buffer" );
GEN_PREFIX( "_flush_buffer" );
GEN_PREFIX( "_load_buffer_state" );
GEN_PREFIX( "_switch_to_buffer" );
GEN_PREFIX( "in" );
GEN_PREFIX( "leng" );
GEN_PREFIX( "lex" );
GEN_PREFIX( "out" );
GEN_PREFIX( "restart" );
GEN_PREFIX( "text" );
if ( do_yylineno )
GEN_PREFIX( "lineno" );
}
if ( do_yywrap )
GEN_PREFIX( "wrap" );
outn( "" );
}
if ( did_outfilename )
line_directive_out( stdout, 0 );
skelout();
}
1993-03-21 12:45:37 +03:00
/* flexend - terminate flex
*
* note
* This routine does not return.
*/
1993-12-02 22:17:24 +03:00
void flexend( exit_status )
int exit_status;
1993-03-21 12:45:37 +03:00
{
1993-12-02 22:17:24 +03:00
int tblsiz;
int unlink();
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( skelfile != NULL )
{
if ( ferror( skelfile ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "input error reading skeleton file %s" ),
skelname );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
else if ( fclose( skelfile ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "error closing skeleton file %s" ),
skelname );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( exit_status != 0 && outfile_created )
{
if ( ferror( stdout ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "error writing output file %s" ),
outfilename );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
else if ( fclose( stdout ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "error closing output file %s" ),
outfilename );
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
else if ( unlink( outfilename ) )
lerrsf( _( "error deleting output file %s" ),
outfilename );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( backing_up_report && backing_up_file )
{
if ( num_backing_up == 0 )
1995-05-05 09:35:08 +04:00
fprintf( backing_up_file, _( "No backing up.\n" ) );
1993-12-02 22:17:24 +03:00
else if ( fullspd || fulltbl )
fprintf( backing_up_file,
1995-05-05 09:35:08 +04:00
_( "%d backing up (non-accepting) states.\n" ),
1993-12-02 22:17:24 +03:00
num_backing_up );
else
fprintf( backing_up_file,
1995-05-05 09:35:08 +04:00
_( "Compressed tables always back up.\n" ) );
1993-12-02 22:17:24 +03:00
if ( ferror( backing_up_file ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "error writing backup file %s" ),
backing_name );
1993-12-02 22:17:24 +03:00
else if ( fclose( backing_up_file ) )
1995-05-05 09:35:08 +04:00
lerrsf( _( "error closing backup file %s" ),
backing_name );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
if ( printstats )
1993-12-02 22:17:24 +03:00
{
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( "%s version %s usage statistics:\n" ),
1993-12-02 22:17:24 +03:00
program_name, flex_version );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " scanner options: -" ) );
1993-12-02 22:17:24 +03:00
if ( C_plus_plus )
putc( '+', stderr );
if ( backing_up_report )
putc( 'b', stderr );
if ( ddebug )
putc( 'd', stderr );
if ( caseins )
putc( 'i', stderr );
if ( lex_compat )
putc( 'l', stderr );
if ( performance_report > 0 )
putc( 'p', stderr );
if ( performance_report > 1 )
putc( 'p', stderr );
if ( spprdflt )
putc( 's', stderr );
if ( use_stdout )
putc( 't', stderr );
if ( printstats )
putc( 'v', stderr ); /* always true! */
if ( nowarn )
putc( 'w', stderr );
1995-05-05 09:35:08 +04:00
if ( interactive == false )
1993-12-02 22:17:24 +03:00
putc( 'B', stderr );
1995-05-05 09:35:08 +04:00
if ( interactive == true )
1993-12-02 22:17:24 +03:00
putc( 'I', stderr );
if ( ! gen_line_dirs )
putc( 'L', stderr );
if ( trace )
putc( 'T', stderr );
1995-05-05 09:35:08 +04:00
if ( csize == unspecified )
/* We encountered an error fairly early on, so csize
* never got specified. Define it now, to prevent
* bogus table sizes being written out below.
*/
csize = 256;
1993-12-02 22:17:24 +03:00
if ( csize == 128 )
putc( '7', stderr );
else
putc( '8', stderr );
fprintf( stderr, " -C" );
if ( long_align )
putc( 'a', stderr );
if ( fulltbl )
putc( 'f', stderr );
if ( fullspd )
putc( 'F', stderr );
if ( useecs )
putc( 'e', stderr );
if ( usemecs )
putc( 'm', stderr );
if ( use_read )
putc( 'r', stderr );
1995-05-05 09:35:08 +04:00
if ( did_outfilename )
fprintf( stderr, " -o%s", outfilename );
1993-12-02 22:17:24 +03:00
if ( skelname )
fprintf( stderr, " -S%s", skelname );
1994-01-07 02:58:18 +03:00
if ( strcmp( prefix, "yy" ) )
1993-12-02 22:17:24 +03:00
fprintf( stderr, " -P%s", prefix );
putc( '\n', stderr );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d/%d NFA states\n" ),
lastnfa, current_mns );
fprintf( stderr, _( " %d/%d DFA states (%d words)\n" ),
lastdfa, current_max_dfas, totnst );
fprintf( stderr, _( " %d rules\n" ),
1993-12-02 22:17:24 +03:00
num_rules + num_eof_rules - 1 /* - 1 for def. rule */ );
if ( num_backing_up == 0 )
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " No backing up\n" ) );
1993-12-02 22:17:24 +03:00
else if ( fullspd || fulltbl )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d backing-up (non-accepting) states\n" ),
1993-12-02 22:17:24 +03:00
num_backing_up );
else
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " Compressed tables always back-up\n" ) );
1993-12-02 22:17:24 +03:00
if ( bol_needed )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " Beginning-of-line patterns used\n" ) );
1993-12-02 22:17:24 +03:00
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d/%d start conditions\n" ), lastsc,
1993-12-02 22:17:24 +03:00
current_max_scs );
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d epsilon states, %d double epsilon states\n" ),
1993-12-02 22:17:24 +03:00
numeps, eps2 );
if ( lastccl == 0 )
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " no character classes\n" ) );
1993-12-02 22:17:24 +03:00
else
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d/%d character classes needed %d/%d words of storage, %d reused\n" ),
1993-12-02 22:17:24 +03:00
lastccl, current_maxccls,
cclmap[lastccl] + ccllen[lastccl],
current_max_ccl_tbl_size, cclreuse );
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d state/nextstate pairs created\n" ),
1993-12-02 22:17:24 +03:00
numsnpairs );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d/%d unique/duplicate transitions\n" ),
1993-12-02 22:17:24 +03:00
numuniq, numdup );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( fulltbl )
{
tblsiz = lastdfa * numecs;
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d table entries\n" ), tblsiz );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
else
{
tblsiz = 2 * (lastdfa + numtemps) + 2 * tblend;
1995-05-05 09:35:08 +04:00
fprintf( stderr,
_( " %d/%d base-def entries created\n" ),
1993-12-02 22:17:24 +03:00
lastdfa + numtemps, current_max_dfas );
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d/%d (peak %d) nxt-chk entries created\n" ),
1993-12-02 22:17:24 +03:00
tblend, current_max_xpairs, peakpairs );
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d/%d (peak %d) template nxt-chk entries created\n" ),
numtemps * nummecs,
current_max_template_xpairs,
1993-12-02 22:17:24 +03:00
numtemps * numecs );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d empty table entries\n" ),
nummt );
fprintf( stderr, _( " %d protos created\n" ),
numprots );
fprintf( stderr,
_( " %d templates created, %d uses\n" ),
1993-12-02 22:17:24 +03:00
numtemps, tmpuses );
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( useecs )
{
tblsiz = tblsiz + csize;
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d/%d equivalence classes created\n" ),
1993-12-02 22:17:24 +03:00
numecs, csize );
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( usemecs )
{
tblsiz = tblsiz + numecs;
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d/%d meta-equivalence classes created\n" ),
1993-12-02 22:17:24 +03:00
nummecs, csize );
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( " %d (%d saved) hash collisions, %d DFAs equal\n" ),
1993-12-02 22:17:24 +03:00
hshcol, hshsave, dfaeql );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d sets of reallocations needed\n" ),
1993-12-02 22:17:24 +03:00
num_reallocs );
1995-05-05 09:35:08 +04:00
fprintf( stderr, _( " %d total table entries needed\n" ),
tblsiz );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
exit( exit_status );
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
/* flexinit - initialize flex */
1993-03-21 12:45:37 +03:00
void flexinit( argc, argv )
int argc;
char **argv;
{
1993-12-02 22:17:24 +03:00
int i, sawcmpflag;
char *arg, *mktemp();
printstats = syntaxerror = trace = spprdflt = caseins = false;
1995-05-05 09:35:08 +04:00
lex_compat = C_plus_plus = backing_up_report = ddebug = fulltbl = false;
fullspd = long_align = nowarn = yymore_used = continued_action = false;
do_yylineno = yytext_is_array = in_rule = reject = do_stdinit = false;
yymore_really_used = reject_really_used = unspecified;
interactive = csize = unspecified;
do_yywrap = gen_line_dirs = usemecs = useecs = true;
1993-12-02 22:17:24 +03:00
performance_report = 0;
1995-05-05 09:35:08 +04:00
did_outfilename = 0;
prefix = "yy";
yyclass = 0;
use_read = use_stdout = false;
1993-12-02 22:17:24 +03:00
sawcmpflag = false;
/* Initialize dynamic array for holding the rule actions. */
action_size = 2048; /* default size of action array in bytes */
action_array = allocate_character_array( action_size );
defs1_offset = prolog_offset = action_offset = action_index = 0;
action_array[0] = '\0';
program_name = argv[0];
if ( program_name[0] != '\0' &&
1994-01-07 02:58:18 +03:00
program_name[strlen( program_name ) - 1] == '+' )
1993-12-02 22:17:24 +03:00
C_plus_plus = true;
/* read flags */
for ( --argc, ++argv; argc ; --argc, ++argv )
{
1995-05-05 09:35:08 +04:00
arg = argv[0];
if ( arg[0] != '-' || arg[1] == '\0' )
1993-12-02 22:17:24 +03:00
break;
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
if ( arg[1] == '-' )
{ /* --option */
if ( ! strcmp( arg, "--help" ) )
arg = "-h";
else if ( ! strcmp( arg, "--version" ) )
arg = "-V";
else if ( ! strcmp( arg, "--" ) )
{ /* end of options */
--argc;
++argv;
break;
}
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
for ( i = 1; arg[i] != '\0'; ++i )
switch ( arg[i] )
{
case '+':
C_plus_plus = true;
break;
case 'B':
interactive = false;
break;
case 'b':
backing_up_report = true;
break;
case 'c':
1995-05-05 09:35:08 +04:00
break;
1993-12-02 22:17:24 +03:00
case 'C':
if ( i != 1 )
flexerror(
1995-05-05 09:35:08 +04:00
_( "-C flag must be given separately" ) );
1993-12-02 22:17:24 +03:00
if ( ! sawcmpflag )
{
useecs = false;
usemecs = false;
fulltbl = false;
sawcmpflag = true;
}
for ( ++i; arg[i] != '\0'; ++i )
switch ( arg[i] )
{
case 'a':
long_align =
true;
break;
case 'e':
useecs = true;
break;
case 'F':
fullspd = true;
break;
case 'f':
fulltbl = true;
break;
case 'm':
usemecs = true;
break;
case 'r':
use_read = true;
break;
default:
lerrif(
1995-05-05 09:35:08 +04:00
_( "unknown -C option '%c'" ),
1993-12-02 22:17:24 +03:00
(int) arg[i] );
break;
}
goto get_next_arg;
case 'd':
ddebug = true;
break;
case 'f':
useecs = usemecs = false;
use_read = fulltbl = true;
break;
case 'F':
useecs = usemecs = false;
use_read = fullspd = true;
break;
1995-05-05 09:35:08 +04:00
case '?':
1993-12-02 22:17:24 +03:00
case 'h':
usage();
exit( 0 );
case 'I':
interactive = true;
break;
case 'i':
caseins = true;
break;
case 'l':
lex_compat = true;
break;
case 'L':
gen_line_dirs = false;
break;
case 'n':
/* Stupid do-nothing deprecated
* option.
*/
break;
1995-05-05 09:35:08 +04:00
case 'o':
if ( i != 1 )
flexerror(
_( "-o flag must be given separately" ) );
outfilename = arg + i + 1;
did_outfilename = 1;
goto get_next_arg;
1993-12-02 22:17:24 +03:00
case 'P':
if ( i != 1 )
flexerror(
1995-05-05 09:35:08 +04:00
_( "-P flag must be given separately" ) );
1993-12-02 22:17:24 +03:00
prefix = arg + i + 1;
goto get_next_arg;
case 'p':
++performance_report;
break;
case 'S':
if ( i != 1 )
flexerror(
1995-05-05 09:35:08 +04:00
_( "-S flag must be given separately" ) );
1993-12-02 22:17:24 +03:00
skelname = arg + i + 1;
goto get_next_arg;
case 's':
spprdflt = true;
break;
case 't':
use_stdout = true;
break;
case 'T':
trace = true;
break;
case 'v':
printstats = true;
break;
case 'V':
1995-05-05 09:35:08 +04:00
printf( _( "%s version %s\n" ),
1993-12-02 22:17:24 +03:00
program_name, flex_version );
exit( 0 );
case 'w':
nowarn = true;
break;
case '7':
csize = 128;
break;
case '8':
csize = CSIZE;
break;
default:
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "%s: unknown flag '%c'. For usage, try\n\t%s --help\n" ),
program_name, (int) arg[i],
program_name );
1993-12-02 22:17:24 +03:00
exit( 1 );
}
1995-05-05 09:35:08 +04:00
/* Used by -C, -S, -o, and -P flags in lieu of a "continue 2"
1993-12-02 22:17:24 +03:00
* control.
*/
get_next_arg: ;
}
num_input_files = argc;
input_files = argv;
set_input_file( num_input_files > 0 ? input_files[0] : NULL );
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
lastccl = lastsc = lastdfa = lastnfa = 0;
1993-12-02 22:17:24 +03:00
num_rules = num_eof_rules = default_rule = 0;
numas = numsnpairs = tmpuses = 0;
numecs = numeps = eps2 = num_reallocs = hshcol = dfaeql = totnst = 0;
numuniq = numdup = hshsave = eofseen = datapos = dataline = 0;
num_backing_up = onesp = numprots = 0;
variable_trailing_context_rules = bol_needed = false;
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
out_linenum = linenum = sectnum = 1;
1993-12-02 22:17:24 +03:00
firstprot = NIL;
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
/* Used in mkprot() so that the first proto goes in slot 1
* of the proto queue.
*/
lastprot = 1;
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
set_up_initial_allocations();
1993-03-21 12:45:37 +03:00
}
1993-12-02 22:17:24 +03:00
/* readin - read in the rules section of the input file(s) */
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
void readin()
{
1995-05-05 09:35:08 +04:00
static char yy_stdinit[] = "FILE *yyin = stdin, *yyout = stdout;";
static char yy_nostdinit[] =
"FILE *yyin = (FILE *) 0, *yyout = (FILE *) 0;";
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
line_directive_out( (FILE *) 0, 1 );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( yyparse() )
{
1995-05-05 09:35:08 +04:00
pinpoint_message( _( "fatal parse error" ) );
1993-12-02 22:17:24 +03:00
flexend( 1 );
}
1993-03-21 12:45:37 +03:00
1993-12-14 05:09:50 +03:00
if ( syntaxerror )
flexend( 1 );
1995-05-05 09:35:08 +04:00
if ( backing_up_report )
{
backing_up_file = fopen( backing_name, "w" );
if ( backing_up_file == NULL )
lerrsf(
_( "could not create backing-up info file %s" ),
backing_name );
}
else
backing_up_file = NULL;
if ( yymore_really_used == true )
1993-12-14 05:09:50 +03:00
yymore_used = true;
1995-05-05 09:35:08 +04:00
else if ( yymore_really_used == false )
1993-12-14 05:09:50 +03:00
yymore_used = false;
1995-05-05 09:35:08 +04:00
if ( reject_really_used == true )
1993-12-14 05:09:50 +03:00
reject = true;
1995-05-05 09:35:08 +04:00
else if ( reject_really_used == false )
1993-12-14 05:09:50 +03:00
reject = false;
if ( performance_report > 0 )
{
if ( lex_compat )
{
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "-l AT&T lex compatibility option entails a large performance penalty\n" ) );
fprintf( stderr,
_( " and may be the actual source of other reported performance penalties\n" ) );
}
else if ( do_yylineno )
{
1993-12-14 05:09:50 +03:00
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "%%option yylineno entails a large performance penalty\n" ) );
1993-12-14 05:09:50 +03:00
}
if ( performance_report > 1 )
{
if ( interactive )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "-I (interactive) entails a minor performance penalty\n" ) );
1993-12-14 05:09:50 +03:00
if ( yymore_used )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "yymore() entails a minor performance penalty\n" ) );
1993-12-14 05:09:50 +03:00
}
if ( reject )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "REJECT entails a large performance penalty\n" ) );
1993-12-14 05:09:50 +03:00
if ( variable_trailing_context_rules )
fprintf( stderr,
1995-05-05 09:35:08 +04:00
_( "Variable trailing context rules entail a large performance penalty\n" ) );
1993-12-14 05:09:50 +03:00
}
if ( reject )
real_reject = true;
if ( variable_trailing_context_rules )
reject = true;
if ( (fulltbl || fullspd) && reject )
{
if ( real_reject )
1995-05-05 09:35:08 +04:00
flexerror(
_( "REJECT cannot be used with -f or -F" ) );
else if ( do_yylineno )
flexerror(
_( "%option yylineno cannot be used with -f or -F" ) );
1993-12-14 05:09:50 +03:00
else
flexerror(
1995-05-05 09:35:08 +04:00
_( "variable trailing context rules cannot be used with -f or -F" ) );
}
if ( reject )
outn( "\n#define YY_USES_REJECT" );
if ( ! do_yywrap )
{
outn( "\n#define yywrap() 1" );
outn( "#define YY_SKIP_YYWRAP" );
1993-12-14 05:09:50 +03:00
}
1995-05-05 09:35:08 +04:00
if ( ddebug )
outn( "\n#define FLEX_DEBUG" );
1993-12-02 22:17:24 +03:00
if ( csize == 256 )
1995-05-05 09:35:08 +04:00
outn( "typedef unsigned char YY_CHAR;" );
1993-12-02 22:17:24 +03:00
else
1995-05-05 09:35:08 +04:00
outn( "typedef char YY_CHAR;" );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( C_plus_plus )
{
1995-05-05 09:35:08 +04:00
outn( "#define yytext_ptr yytext" );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( interactive )
1995-05-05 09:35:08 +04:00
outn( "#define YY_INTERACTIVE" );
}
else
{
if ( do_stdinit )
{
outn( "#ifdef VMS" );
outn( "#ifndef __VMS_POSIX" );
outn( yy_nostdinit );
outn( "#else" );
outn( yy_stdinit );
outn( "#endif" );
outn( "#else" );
outn( yy_stdinit );
outn( "#endif" );
}
else
outn( yy_nostdinit );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( fullspd )
1995-05-05 09:35:08 +04:00
outn( "typedef yyconst struct yy_trans_info *yy_state_type;" );
1993-12-06 22:29:01 +03:00
else if ( ! C_plus_plus )
1995-05-05 09:35:08 +04:00
outn( "typedef int yy_state_type;" );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( ddebug )
1995-05-05 09:35:08 +04:00
outn( "\n#define FLEX_DEBUG" );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( lex_compat )
1995-05-05 09:35:08 +04:00
outn( "#define YY_FLEX_LEX_COMPAT" );
if ( do_yylineno && ! C_plus_plus )
1993-12-02 22:17:24 +03:00
{
1995-05-05 09:35:08 +04:00
outn( "extern int yylineno;" );
outn( "int yylineno = 1;" );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( C_plus_plus )
1995-05-05 09:35:08 +04:00
{
outn( "\n#include <FlexLexer.h>" );
if ( yyclass )
{
outn( "int yyFlexLexer::yylex()" );
outn( "\t{" );
outn(
"\tLexerError( \"yyFlexLexer::yylex invoked but %option yyclass used\" );" );
outn( "\treturn 0;" );
outn( "\t}" );
out_str( "\n#define YY_DECL int %s::yylex()\n",
yyclass );
}
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
else
{
if ( yytext_is_array )
1995-05-05 09:35:08 +04:00
outn( "extern char yytext[];\n" );
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
else
{
1995-05-05 09:35:08 +04:00
outn( "extern char *yytext;" );
outn( "#define yytext_ptr yytext" );
1993-12-02 22:17:24 +03:00
}
1995-05-05 09:35:08 +04:00
if ( yyclass )
flexerror(
_( "%option yyclass only meaningful for C++ scanners" ) );
1993-12-02 22:17:24 +03:00
}
1993-03-21 12:45:37 +03:00
1993-12-02 22:17:24 +03:00
if ( useecs )
numecs = cre8ecs( nextecm, ecgroup, csize );
else
numecs = csize;
/* Now map the equivalence class for NUL to its expected place. */
ecgroup[0] = ecgroup[csize];
1993-12-09 22:06:03 +03:00
NUL_ec = ABS( ecgroup[0] );
1993-12-02 22:17:24 +03:00
if ( useecs )
ccl2ecl();
}
1993-03-21 12:45:37 +03:00
/* set_up_initial_allocations - allocate memory for internal tables */
void set_up_initial_allocations()
1993-12-02 22:17:24 +03:00
{
current_mns = INITIAL_MNS;
firstst = allocate_integer_array( current_mns );
lastst = allocate_integer_array( current_mns );
finalst = allocate_integer_array( current_mns );
transchar = allocate_integer_array( current_mns );
trans1 = allocate_integer_array( current_mns );
trans2 = allocate_integer_array( current_mns );
accptnum = allocate_integer_array( current_mns );
assoc_rule = allocate_integer_array( current_mns );
state_type = allocate_integer_array( current_mns );
current_max_rules = INITIAL_MAX_RULES;
rule_type = allocate_integer_array( current_max_rules );
rule_linenum = allocate_integer_array( current_max_rules );
rule_useful = allocate_integer_array( current_max_rules );
current_max_scs = INITIAL_MAX_SCS;
scset = allocate_integer_array( current_max_scs );
scbol = allocate_integer_array( current_max_scs );
scxclu = allocate_integer_array( current_max_scs );
sceof = allocate_integer_array( current_max_scs );
scname = allocate_char_ptr_array( current_max_scs );
current_maxccls = INITIAL_MAX_CCLS;
cclmap = allocate_integer_array( current_maxccls );
ccllen = allocate_integer_array( current_maxccls );
cclng = allocate_integer_array( current_maxccls );
current_max_ccl_tbl_size = INITIAL_MAX_CCL_TBL_SIZE;
ccltbl = allocate_Character_array( current_max_ccl_tbl_size );
current_max_dfa_size = INITIAL_MAX_DFA_SIZE;
current_max_xpairs = INITIAL_MAX_XPAIRS;
nxt = allocate_integer_array( current_max_xpairs );
chk = allocate_integer_array( current_max_xpairs );
current_max_template_xpairs = INITIAL_MAX_TEMPLATE_XPAIRS;
tnxt = allocate_integer_array( current_max_template_xpairs );
current_max_dfas = INITIAL_MAX_DFAS;
base = allocate_integer_array( current_max_dfas );
def = allocate_integer_array( current_max_dfas );
dfasiz = allocate_integer_array( current_max_dfas );
accsiz = allocate_integer_array( current_max_dfas );
dhash = allocate_integer_array( current_max_dfas );
dss = allocate_int_ptr_array( current_max_dfas );
dfaacc = allocate_dfaacc_union( current_max_dfas );
nultrans = (int *) 0;
}
void usage()
{
1995-05-05 09:35:08 +04:00
FILE *f = stdout;
fprintf( f,
_( "%s [-bcdfhilnpstvwBFILTV78+? -C[aefFmr] -ooutput -Pprefix -Sskeleton]\n" ),
1993-12-02 22:17:24 +03:00
program_name );
1995-05-05 09:35:08 +04:00
fprintf( f, _( "\t[--help --version] [file ...]\n" ) );
fprintf( f, _( "\t-b generate backing-up information to %s\n" ),
backing_name );
fprintf( f, _( "\t-c do-nothing POSIX option\n" ) );
fprintf( f, _( "\t-d turn on debug mode in generated scanner\n" ) );
fprintf( f, _( "\t-f generate fast, large scanner\n" ) );
fprintf( f, _( "\t-h produce this help message\n" ) );
fprintf( f, _( "\t-i generate case-insensitive scanner\n" ) );
fprintf( f, _( "\t-l maximal compatibility with original lex\n" ) );
fprintf( f, _( "\t-n do-nothing POSIX option\n" ) );
fprintf( f, _( "\t-p generate performance report to stderr\n" ) );
fprintf( f,
_( "\t-s suppress default rule to ECHO unmatched text\n" ) );
if ( ! did_outfilename )
{
sprintf( outfile_path, outfile_template,
prefix, C_plus_plus ? "cc" : "c" );
outfilename = outfile_path;
}
1993-03-21 12:45:37 +03:00
1995-05-05 09:35:08 +04:00
fprintf( f,
_( "\t-t write generated scanner on stdout instead of %s\n" ),
outfilename );
fprintf( f,
_( "\t-v write summary of scanner statistics to f\n" ) );
fprintf( f, _( "\t-w do not generate warnings\n" ) );
fprintf( f, _( "\t-B generate batch scanner (opposite of -I)\n" ) );
fprintf( f,
_( "\t-F use alternative fast scanner representation\n" ) );
fprintf( f,
_( "\t-I generate interactive scanner (opposite of -B)\n" ) );
fprintf( f, _( "\t-L suppress #line directives in scanner\n" ) );
fprintf( f, _( "\t-T %s should run in trace mode\n" ), program_name );
fprintf( f, _( "\t-V report %s version\n" ), program_name );
fprintf( f, _( "\t-7 generate 7-bit scanner\n" ) );
fprintf( f, _( "\t-8 generate 8-bit scanner\n" ) );
fprintf( f, _( "\t-+ generate C++ scanner class\n" ) );
fprintf( f, _( "\t-? produce this help message\n" ) );
fprintf( f,
_( "\t-C specify degree of table compression (default is -Cem):\n" ) );
fprintf( f,
_( "\t\t-Ca trade off larger tables for better memory alignment\n" ) );
fprintf( f, _( "\t\t-Ce construct equivalence classes\n" ) );
fprintf( f,
_( "\t\t-Cf do not compress scanner tables; use -f representation\n" ) );
fprintf( f,
_( "\t\t-CF do not compress scanner tables; use -F representation\n" ) );
fprintf( f, _( "\t\t-Cm construct meta-equivalence classes\n" ) );
fprintf( f,
_( "\t\t-Cr use read() instead of stdio for scanner input\n" ) );
fprintf( f, _( "\t-o specify output filename\n" ) );
fprintf( f, _( "\t-P specify scanner prefix other than \"yy\"\n" ) );
fprintf( f, _( "\t-S specify skeleton file\n" ) );
fprintf( f, _( "\t--help produce this help message\n" ) );
fprintf( f, _( "\t--version report %s version\n" ), program_name );
1993-12-02 22:17:24 +03:00
}