src - FreeBSD source tree

diff options


context:
space:
mode:

author	Geoff Rehmet <csgr@FreeBSD.org>	1994-08-24 13:10:34 +0000
committer	Geoff Rehmet <csgr@FreeBSD.org>	1994-08-24 13:10:34 +0000
commit	8387c24d794dc69c6d3d27b2326e6019518bdfc4 (patch)
tree	c1ef3d28221496e6e87f29d5b1970f4b29776afa
download	src-8387c24d794dc69c6d3d27b2326e6019518bdfc4.tar.gz src-8387c24d794dc69c6d3d27b2326e6019518bdfc4.zip

Flex version 2.4.7 from LBL vendor/flex/2.4.7

Reviewed by: Geoff.

Notes

Notes: svn path=/vendor/flex/dist/; revision=2258 svn path=/vendor/flex/2.4.7/; revision=2260; tag=vendor/flex/2.4.7

Diffstat

-rw-r--r--

usr.bin/lex/COPYING

-rw-r--r--

usr.bin/lex/FlexLexer.h

175

-rw-r--r--

usr.bin/lex/Makefile

-rw-r--r--

usr.bin/lex/NEWS

703

-rw-r--r--

usr.bin/lex/README

-rw-r--r--

usr.bin/lex/ccl.c

149

-rw-r--r--

usr.bin/lex/dfa.c

1085

-rw-r--r--

usr.bin/lex/ecs.c

225

-rw-r--r--

usr.bin/lex/flex.skl

1225

-rw-r--r--

usr.bin/lex/flexdef.h

902

-rw-r--r--

usr.bin/lex/flexdoc.1

3045

-rw-r--r--

usr.bin/lex/gen.c

1461

-rw-r--r--

usr.bin/lex/initscan.c

2723

-rw-r--r--

usr.bin/lex/lex.1

1001

-rw-r--r--

usr.bin/lex/lib/Makefile

-rw-r--r--

usr.bin/lex/lib/libmain.c

-rw-r--r--

usr.bin/lex/lib/libyywrap.c

-rw-r--r--

usr.bin/lex/main.c

989

-rw-r--r--

usr.bin/lex/misc.c

773

-rwxr-xr-x

usr.bin/lex/mkskel.sh

-rw-r--r--

usr.bin/lex/nfa.c

709

-rw-r--r--

usr.bin/lex/parse.y

817

-rw-r--r--

usr.bin/lex/scan.l

572

-rw-r--r--

usr.bin/lex/skel.c

1232

-rw-r--r--

usr.bin/lex/sym.c

262

-rw-r--r--

usr.bin/lex/tblcmp.c

888

-rw-r--r--

usr.bin/lex/version.h

-rw-r--r--

usr.bin/lex/yylex.c

199

28 files changed, 19354 insertions, 0 deletions

diff --git a/usr.bin/lex/COPYING b/usr.bin/lex/COPYING
new file mode 100644
index 000000000000..dcb775e7c606
--- /dev/null
+++ b/usr.bin/lex/COPYING

@@ -0,0 +1,38 @@

+Flex carries the copyright used for BSD software, slightly modified

+because it originated at the Lawrence Berkeley (not Livermore!) Laboratory,

+which operates under a contract with the Department of Energy:

+ This code is derived from software contributed to Berkeley by

+ Vern Paxson.

+ The United States Government has rights in this work pursuant

+ to contract no. DE-AC03-76SF00098 between the United States

+ Department of Energy and the University of California.

+ Redistribution and use in source and binary forms are permitted

+ provided that: (1) source distributions retain this entire

+ copyright notice and comment, and (2) distributions including

+ binaries display the following acknowledgement: ``This product

+ includes software developed by the University of California,

+ Berkeley and its contributors'' in the documentation or other

+ materials provided with the distribution and in all advertising

+ materials mentioning features or use of this software. Neither the

+ name of the University nor the names of its contributors may be

+ used to endorse or promote products derived from this software

+ without specific prior written permission.

+ THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR

+ IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED

+ WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR

+ PURPOSE.

+This basically says "do whatever you please with this software except

+remove this notice or take advantage of the University's (or the flex

+authors') name".

+Note that the "flex.skl" scanner skeleton carries no copyright notice.

+You are free to do whatever you please with scanners generated using flex;

+for them, you are not even bound by the above copyright.

diff --git a/usr.bin/lex/FlexLexer.h b/usr.bin/lex/FlexLexer.h
new file mode 100644
index 000000000000..feb40b66265d
--- /dev/null
+++ b/usr.bin/lex/FlexLexer.h

@@ -0,0 +1,175 @@

+// $Header: FlexLexer.h,v 1.2 94/01/04 14:57:26 vern Exp $

+// FlexLexer.h -- define classes for lexical analyzers generated by flex

+//

+// This code is derived from software contributed to Berkeley by

+// Kent Williams and Tom Epperly.

+//

+// Redistribution and use in source and binary forms are permitted provided

+// that: (1) source distributions retain this entire copyright notice and

+// comment, and (2) distributions including binaries display the following

+// acknowledgement: ``This product includes software developed by the

+// University of California, Berkeley and its contributors'' in the

+// documentation or other materials provided with the distribution and in

+// all advertising materials mentioning features or use of this software.

+// Neither the name of the University nor the names of its contributors may

+// be used to endorse or promote products derived from this software without

+// specific prior written permission.

+// THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED

+// WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF

+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.

+#ifndef __FLEX_LEXER_H

+#define __FLEX_LEXER_H

+// This file defines two classes. The first, FlexLexer, is an abstract

+// class which specifies the external interface provided to flex C++

+// lexer objects. The second, yyFlexLexer, fills out most of the meat

+// of the lexer class; its internals may vary from lexer to lexer

+// depending on things like whether REJECT is used.

+//

+// If you want to create multiple lexer classes, you use the -P flag

+// to rename each yyFlexLexer to some other xxFlexLexer.

+#include <iostream.h>

+extern "C++" {

+struct yy_buffer_state;

+typedef int yy_state_type;

+class FlexLexer {

+public:

+ virtual ~FlexLexer() { }

+ const char* YYText() { return yytext; }

+ int YYLeng() { return yyleng; }

+ virtual void

+ yy_switch_to_buffer( struct yy_buffer_state* new_buffer ) = 0;

+ virtual struct yy_buffer_state*

+ yy_create_buffer( istream* s, int size ) = 0;

+ virtual void yy_delete_buffer( struct yy_buffer_state* b ) = 0;

+ virtual void yyrestart( istream* s ) = 0;

+ virtual int yylex() = 0;

+protected:

+ char* yytext;

+ int yyleng;

+};

+class yyFlexLexer : public FlexLexer {

+public:

+ // arg_yyin and arg_yyout default to the cin and cout, but we

+ // only make that assignment when initializing in yylex().

+ yyFlexLexer( istream* arg_yyin = 0, ostream* arg_yyout = 0 )

+ {

+ yyin = arg_yyin;

+ yyout = arg_yyout;

+ yy_c_buf_p = 0;

+ yy_init = 1;

+ yy_start = 0;

+ yy_did_buffer_switch_on_eof = 0;

+ yy_looking_for_trail_begin = 0;

+ yy_more_flag = 0;

+ yy_more_len = 0;

+ yy_start_stack_ptr = yy_start_stack_depth = 0;

+ yy_start_stack = 0;

+ yy_current_buffer = 0;

+#ifdef YY_USES_REJECT

+ yy_state_buf = new yy_state_type[YY_BUF_SIZE + 2];

+#else

+ yy_state_buf = 0;

+#endif

+ }

+ virtual ~yyFlexLexer()

+ {

+ delete yy_state_buf;

+ }

+ void yy_switch_to_buffer( struct yy_buffer_state* new_buffer );

+ struct yy_buffer_state* yy_create_buffer( istream* s, int size );

+ void yy_delete_buffer( struct yy_buffer_state* b );

+ void yyrestart( istream* s );

+ virtual int yylex();

+protected:

+ virtual int LexerInput( char* buf, int max_size );

+ virtual void LexerOutput( const char* buf, int size );

+ virtual void LexerError( const char* msg );

+ void yyunput( int c, char* buf_ptr );

+ int yyinput();

+ void yy_load_buffer_state();

+ void yy_init_buffer( struct yy_buffer_state* b, istream* s );

+ int yy_start_stack_ptr;

+ int yy_start_stack_depth;

+ int* yy_start_stack;

+ void yy_push_state( int new_state );

+ void yy_pop_state();

+ int yy_top_state();

+ yy_state_type yy_get_previous_state();

+ yy_state_type yy_try_NUL_trans( yy_state_type current_state );

+ int yy_get_next_buffer();

+ istream* yyin; // input source for default LexerInput

+ ostream* yyout; // output sink for default LexerOutput

+ struct yy_buffer_state* yy_current_buffer;

+ // yy_hold_char holds the character lost when yytext is formed.

+ char yy_hold_char;

+ // Number of characters read into yy_ch_buf.

+ int yy_n_chars;

+ // Points to current character in buffer.

+ char* yy_c_buf_p;

+ int yy_init; // whether we need to initialize

+ int yy_start; // start state number

+ // Flag which is used to allow yywrap()'s to do buffer switches

+ // instead of setting up a fresh yyin. A bit of a hack ...

+ int yy_did_buffer_switch_on_eof;

+ // The following are not always needed, but may be depending

+ // on use of certain flex features (like REJECT or yymore()).

+ yy_state_type yy_last_accepting_state;

+ char* yy_last_accepting_cpos;

+ yy_state_type* yy_state_buf;

+ yy_state_type* yy_state_ptr;

+ char* yy_full_match;

+ int* yy_full_state;

+ int yy_full_lp;

+ int yy_lp;

+ int yy_looking_for_trail_begin;

+ int yy_more_flag;

+ int yy_more_len;

+};

+#endif

diff --git a/usr.bin/lex/Makefile b/usr.bin/lex/Makefile
new file mode 100644
index 000000000000..7f88e6eea4de
--- /dev/null
+++ b/usr.bin/lex/Makefile

@@ -0,0 +1,57 @@

+# $Id$

+# By default, flex will be configured to generate 8-bit scanners only if the

+# -8 flag is given. If you want it to always generate 8-bit scanners, add

+# "-DDEFAULT_CSIZE=256" to CFLAGS. Note that doing so will double the size

+# of all uncompressed scanners.

+# Bootstrapping of lex is handled automatically.

+# Also note that flex.skel no longer gets installed.

+# XXX Todo:

+# Install as lex++, and install FlexLexer.h

+PROG= lex

+LINKS= ${BINDIR}/lex ${BINDIR}/flex

+#LINKS+= ${BINDIR}/lex ${BINDIR}/lex++ ${BINDIR}/flex ${BINDIR}/flex++

+SRCS= ccl.c dfa.c ecs.c gen.c main.c misc.c nfa.c parse.y \

+ skel.c sym.c tblcmp.c yylex.c

+OBJS+= scan.o

+LFLAGS+= -is

+CFLAGS+= -I. -I${.CURDIR}

+MAN1= flex.1 flexdoc.1

+MLINKS= flex.1 lex.1 flexdoc.1 lexdoc.1

+CLEANFILES+= parse.c parse.h scan.c y.tab.h

+SUBDIR= lib

+.depend: parse.h

+parse.c parse.h: parse.y

+ $(YACC) -d $(.CURDIR)/parse.y

+ mv y.tab.c parse.c

+ mv y.tab.h parse.h

+.if exists(/usr/bin/lex)

+scan.o: parse.c

+.else

+# We must bootstrap

+scan.o: scan.c parse.h

+scan.c:

+ @echo "Bootstrapping flex"

+ @rm -f scan.c

+ @cp -pf ${.CURDIR}/initscan.c scan.c

+.endif

+test: check

+check: $(PROG)

+ ./$(PROG) $(LFLAGS) -t $(COMPRESSION) $(.CURDIR)/scan.l \

+ | sed s,\"$(.CURDIR)/scan.l",\"scan.l", \

+ | diff $(.CURDIR)/initscan.c -

+ @echo "Check successful"

+.include <bsd.prog.mk>

diff --git a/usr.bin/lex/NEWS b/usr.bin/lex/NEWS
new file mode 100644
index 000000000000..aff90a392a55
--- /dev/null
+++ b/usr.bin/lex/NEWS

@@ -0,0 +1,703 @@

+Changes between release 2.4.7 (03Aug94) and release 2.4.6:

+ - Fixed serious bug in reading multiple files.

+ - Fixed bug in scanning NUL's.

+ - Fixed bug in input() returning 8-bit characters.

+ - Fixed bug in matching text with embedded NUL's when

+ using %array or lex compatibility.

+ - Fixed multiple invocations of YY_USER_ACTION when using '|'

+ continuation action.

+ - Minor prototyping fixes.

+Changes between release 2.4.6 (04Jan94) and release 2.4.5:

+ - Linking with -lfl no longer required if your program includes

+ its own yywrap() and main() functions. (This change will cause

+ problems if you have a non-ANSI compiler on a system for which

+ sizeof(int) != sizeof(void*) or sizeof(int) != sizeof(size_t).)

+ - The use of 'extern "C++"' in FlexLexer.h has been modified to

+ get around an incompatibility with g++'s header files.

+Changes between release 2.4.5 (11Dec93) and release 2.4.4:

+ - Fixed bug breaking C++ scanners that use REJECT or variable

+ trailing context.

+ - Fixed serious input problem for interactive scanners on

+ systems for which char is unsigned.

+ - Fixed bug in incorrectly treating '$' operator as variable

+ trailing context.

+ - Fixed bug in -CF table representation that could lead to

+ corrupt tables.

+ - Fixed fairly benign memory leak.

+ - Added `extern "C++"' wrapper to FlexLexer.h header. This

+ should overcome the g++ 2.5.X problems mentioned in the

+ NEWS for release 2.4.3.

+ - Changed #include of FlexLexer.h to use <> instead of "".

+ - Added feature to control whether the scanner attempts to

+ refill the input buffer once it's exhausted. This feature

+ will be documented in the 2.5 release.

+Changes between release 2.4.4 (07Dec93) and release 2.4.3:

+ - Fixed two serious bugs in scanning 8-bit characters.

+ - Fixed bug in YY_USER_ACTION that caused it to be executed

+ inappropriately (on the scanner's own internal actions, and

+ with incorrect yytext/yyleng values).

+ - Fixed bug in pointing yyin at a new file and resuming scanning.

+ - Portability fix regarding min/max/abs macros conflicting with

+ function definitions in standard header files.

+ - Added a virtual LexerError() method to the C++ yyFlexLexer class

+ for reporting error messages instead of always using cerr.

+ - Added warning in flexdoc that the C++ scanning class is presently

+ experimental and subject to considerable change between major

+ releases.

+Changes between release 2.4.3 (03Dec93) and release 2.4.2:

+ - Fixed bug causing fatal scanner messages to fail to print.

+ - Fixed things so FlexLexer.h can be included in other C++

+ sources. One side-effect of this change is that -+ and -CF

+ are now incompatible.

+ - libfl.a now supplies private versions of the <string.h>/

+ <strings.h> string routines needed by flex and the scanners

+ it generates, to enhance portability to some BSD systems.

+ - More robust solution to 2.4.2's flexfatal() bug fix.

+ - Added ranlib of installed libfl.a.

+ - Some lint tweaks.

+ - NOTE: problems have been encountered attempting to build flex

+ C++ scanners using g++ version 2.5.X. The problem is due to an

+ unfortunate heuristic in g++ 2.5.X that attempts to discern between

+ C and C++ headers. Because FlexLexer.h is installed (by default)

+ in /usr/local/include and not /usr/local/lib/g++-include, g++ 2.5.X

+ decides that it's a C header :-(. So if you have problems, install

+ the header in /usr/local/lib/g++-include instead.

+Changes between release 2.4.2 (01Dec93) and release 2.4.1:

+ - Fixed bug in libfl.a referring to non-existent "flexfatal" function.

+ - Modified to produce both compress'd and gzip'd tar files for

+ distributions (you probably don't care about this change!).

+Changes between release 2.4.1 (30Nov93) and release 2.3.8:

+ - The new '-+' flag instructs flex to generate a C++ scanner class

+ (thanks to Kent Williams). flex writes an implementation of the

+ class defined in FlexLexer.h to lex.yy.cc. You may include

+ multiple scanner classes in your program using the -P flag. Note

+ that the scanner class also provides a mechanism for creating

+ reentrant scanners. The scanner class uses C++ streams for I/O

+ instead of FILE*'s (thanks to Tom Epperly). If the flex executable's

+ name ends in '+' then the '-+' flag is automatically on, so creating

+ a symlink or copy of "flex" to "flex++" results in a version of

+ flex that can be used exclusively for C++ scanners.

+ Note that without the '-+' flag, flex-generated scanners can still

+ be compiled using C++ compilers, though they use FILE*'s for I/O

+ instead of streams.

+ See the "GENERATING C++ SCANNERS" section of flexdoc for details.

+ - The new '-l' flag turns on maximum AT&T lex compatibility. In

+ particular, -l includes support for "yylineno" and makes yytext

+ be an array instead of a pointer. It does not, however, do away

+ with all incompatibilities. See the "INCOMPATIBILITIES WITH LEX

+ AND POSIX" section of flexdoc for details.

+ - The new '-P' option specifies a prefix to use other than "yy"

+ for the scanner's globally-visible variables, and for the

+ "lex.yy.c" filename. Using -P you can link together multiple

+ flex scanners in the same executable.

+ - The distribution includes a "texinfo" version of flexdoc.1,

+ contributed by Roland Pesch (thanks also to Marq Kole, who

+ contributed another version). It has not been brought up to

+ date, but reflects version 2.3. See MISC/flex.texinfo.

+ The flex distribution will soon include G.T. Nicol's flex

+ manual; he is presently bringing it up-to-date for version 2.4.

+ - yywrap() is now a function, and you now *must* link flex scanners

+ with libfl.a.

+ - Site-configuration is now done via an autoconf-generated

+ "configure" script contributed by Francois Pinard.

+ - Scanners now use fread() (or getc(), if interactive) and not

+ read() for input. A new "table compression" option, -Cr,

+ overrides this change and causes the scanner to use read()

+ (because read() is a bit faster than fread()). -f and -F

+ are now equivalent to -Cfr and -CFr; i.e., they imply the

+ -Cr option.

+ - In the blessed name of POSIX compliance, flex supports "%array"

+ and "%pointer" directives in the definitions (first) section of

+ the scanner specification. The former specifies that yytext

+ should be an array (of size YYLMAX), the latter, that it should

+ be a pointer. The array version of yytext is universally slower

+ than the pointer version, but has the advantage that its contents

+ remain unmodified across calls to input() and unput() (the pointer

+ version of yytext is, still, trashed by such calls).

+ "%array" cannot be used with the '-+' C++ scanner class option.

+ - The new '-Ca' option directs flex to trade off memory for

+ natural alignment when generating a scanner's tables. In

+ particular, table entries that would otherwise be "short"

+ become "long".

+ - The new '-h' option produces a summary of the flex flags.

+ - The new '-V' option reports the flex version number and exits.

+ - The new scanner macro YY_START returns an integer value

+ corresponding to the current start condition. You can return

+ to that start condition by passing the value to a subsequent

+ "BEGIN" action. You also can implement "start condition stacks"

+ by storing the values in an integer stack.

+ - You can now redefine macros such as YY_INPUT by just #define'ing

+ them to some other value in the first section of the flex input;

+ no need to first #undef them.

+ - flex now generates warnings for rules that can't be matched.

+ These warnings can be turned off using the new '-w' flag. If

+ your scanner uses REJECT then you will not get these warnings.

+ - If you specify the '-s' flag but the default rule can be matched,

+ flex now generates a warning.

+ - "yyleng" is now a global, and may be modified by the user (though

+ doing so and then using yymore() will yield weird results).

+ - Name definitions in the first section of a scanner specification

+ can now include a leading '^' or trailing '$' operator. In this

+ case, the definition is *not* pushed back inside of parentheses.

+ - Scanners with compressed tables are now "interactive" (-I option)

+ by default. You can suppress this attribute (which makes them

+ run slightly slower) using the new '-B' flag.

+ - Flex now generates 8-bit scanners by default, unless you use the

+ -Cf or -CF compression options (-Cfe and -CFe result in 8-bit

+ scanners). You can force it to generate a 7-bit scanner using

+ the new '-7' flag. You can build flex to generate 8-bit scanners

+ for -Cf and -CF, too, by adding -DDEFAULT_CSIZE=256 to CFLAGS

+ in the Makefile.

+ - You no longer need to call the scanner routine yyrestart() to

+ inform the scanner that you have switched to a new file after

+ having seen an EOF on the current input file. Instead, just

+ point yyin at the new file and continue scanning.

+ - You no longer need to invoke YY_NEW_FILE in an <<EOF>> action

+ to indicate you wish to continue scanning. Simply point yyin

+ at a new file.

+ - A leading '#' no longer introduces a comment in a flex input.

+ - flex no longer considers formfeed ('\f') a whitespace character.

+ - %t, I'm happy to report, has been nuked.

+ - The '-p' option may be given twice ('-pp') to instruct flex to

+ report minor performance problems as well as major ones.

+ - The '-v' verbose output no longer includes start/finish time

+ information.

+ - Newlines in flex inputs can optionally include leading or

+ trailing carriage-returns ('\r'), in support of several PC/Mac

+ run-time libraries that automatically include these.

+ - A start condition of the form "<*>" makes the following rule

+ active in every start condition, whether exclusive or inclusive.

+ - The following items have been corrected in the flex documentation:

+ - '-C' table compression options *are* cumulative.

+ - You may modify yytext but not lengthen it by appending

+ characters to the end. Modifying its final character

+ will affect '^' anchoring for the next rule matched

+ if the character is changed to or from a newline.

+ - The term "backtracking" has been renamed "backing up",

+ since it is a one-time repositioning and not a repeated

+ search. What used to be the "lex.backtrack" file is now

+ "lex.backup".

+ - Unindented "/* ... */" comments are allowed in the first

+ flex input section, but not in the second.

+ - yyless() can only be used in the flex input source, not

+ externally.

+ - You can use "yyrestart(yyin)" to throw away the

+ current contents of the input buffer.

+ - To write high-speed scanners, attempt to match as much

+ text as possible with each rule. See MISC/fastwc/README

+ for more information.

+ - Using the beginning-of-line operator ('^') is fairly

+ cheap. Using unput() is expensive. Using yyless() is

+ cheap.

+ - An example of scanning strings with embedded escape

+ sequences has been added.

+ - The example of backing-up in flexdoc was erroneous; it

+ has been corrected.

+ - A flex scanner's internal buffer now dynamically grows if needed

+ to match large tokens. Note that growing the buffer presently

+ requires rescanning the (large) token, so consuming a lot of

+ text this way is a slow process. Also note that presently the

+ buffer does *not* grow if you unput() more text than can fit

+ into the buffer.

+ - The MISC/ directory has been reorganized; see MISC/README for

+ details.

+ - yyless() can now be used in the third (user action) section

+ of a scanner specification, thanks to Ceriel Jacobs. yyless()

+ remains a macro and cannot be used outside of the scanner source.

+ - The skeleton file is no longer opened at run-time, but instead

+ compiled into a large string array (thanks to John Gilmore and

+ friends at Cygnus). You can still use the -S flag to point flex

+ at a different skeleton file, though if you use this option let

+ me know, as I plan to otherwise do away with -S in the near

+ future.

+ - flex no longer uses a temporary file to store the scanner's

+ actions.

+ - A number of changes have been made to decrease porting headaches.

+ In particular, flex no longer uses memset() or ctime(), and

+ provides a single simple mechanism for dealing with C compilers

+ that still define malloc() as returning char* instead of void*.

+ - Flex now detects if the scanner specification requires the -8 flag

+ but the flag was not given or on by default.

+ - A number of table-expansion fencepost bugs have been fixed,

+ making flex more robust for generating large scanners.

+ - flex more consistently identifies the location of errors in

+ its input.

+ - YY_USER_ACTION is now invoked only for "real" actions, not for

+ internal actions used by the scanner for things like filling

+ the buffer or handling EOF.

+ - The rule "[^]]" now matches any character other than a ']';

+ formerly it matched any character at all followed by a ']'.

+ This change was made for compatibility with AT&T lex.

+ - A large number of miscellaneous bugs have been found and fixed

+ thanks to Gerhard Wilhelms.

+ - The source code has been heavily reformatted, making patches

+ relative to previous flex releases no longer accurate.

+Changes between 2.3 Patch #8 (21Feb93) and 2.3 Patch #7:

+ - Fixed bugs in dynamic memory allocation leading to grievous

+ fencepost problems when generating large scanners.

+ - Fixed bug causing infinite loops on character classes with 8-bit

+ characters in them.

+ - Fixed bug in matching repetitions with a lower bound of 0.

+ - Fixed bug in scanning NUL characters using an "interactive" scanner.

+ - Fixed bug in using yymore() at the end of a file.

+ - Fixed bug in misrecognizing rules with variable trailing context.

+ - Fixed bug compiling flex on Suns using gcc 2.

+ - Fixed bug in not recognizing that input files with the character

+ ASCII 128 in them require the -8 flag.

+ - Fixed bug that could cause an infinite loop writing out

+ error messages.

+ - Fixed bug in not recognizing old-style lex % declarations if

+ followed by a tab instead of a space.

+ - Fixed potential crash when flex terminated early (usually due

+ to a bad flag) and the -v flag had been given.

+ - Added some missing declarations of void functions.

+ - Changed to only use '\a' for __STDC__ compilers.

+ - Updated mailing addresses.

+Changes between 2.3 Patch #7 (28Mar91) and 2.3 Patch #6:

+ - Fixed out-of-bounds array access that caused bad tables

+ to be produced on machines where the bad reference happened

+ to yield a 1. This caused problems installing or running

+ flex on some Suns, in particular.

+Changes between 2.3 Patch #6 (29Aug90) and 2.3 Patch #5:

+ - Fixed a serious bug in yymore() which basically made it

+ completely broken. Thanks goes to Jean Christophe of

+ the Nethack development team for finding the problem

+ and passing along the fix.

+Changes between 2.3 Patch #5 (16Aug90) and 2.3 Patch #4:

+ - An up-to-date version of initscan.c so "make test" will

+ work after applying the previous patches

+Changes between 2.3 Patch #4 (14Aug90) and 2.3 Patch #3:

+ - Fixed bug in hexadecimal escapes which allowed only digits,

+ not letters, in escapes

+ - Fixed bug in previous "Changes" file!

+Changes between 2.3 Patch #3 (03Aug90) and 2.3 Patch #2:

+ - Correction to patch #2 for gcc compilation; thanks goes to

+ Paul Eggert for catching this.

+Changes between 2.3 Patch #2 (02Aug90) and original 2.3 release:

+ - Fixed (hopefully) headaches involving declaring malloc()

+ and free() for gcc, which defines __STDC__ but (often) doesn't

+ come with the standard include files such as <stdlib.h>.

+ Reordered #ifdef maze in the scanner skeleton in the hope of

+ getting the declarations right for cfront and g++, too.

+ - Note that this patch supersedes patch #1 for release 2.3,

+ which was never announced but was available briefly for

+ anonymous ftp.

+Changes between 2.3 (full) release of 28Jun90 and 2.2 (alpha) release:

+ User-visible:

+ - A lone <<EOF>> rule (that is, one which is not qualified with

+ a list of start conditions) now specifies the EOF action for

+ *all* start conditions which haven't already had <<EOF>> actions

+ given. To specify an end-of-file action for just the initial

+ state, use <INITIAL><<EOF>>.

+ - -d debug output is now contingent on the global yy_flex_debug

+ being set to a non-zero value, which it is by default.

+ - A new macro, YY_USER_INIT, is provided for the user to specify

+ initialization action to be taken on the first call to the

+ scanner. This action is done before the scanner does its

+ own initialization.

+ - yy_new_buffer() has been added as an alias for yy_create_buffer()

+ - Comments beginning with '#' and extending to the end of the line

+ now work, but have been deprecated (in anticipation of making

+ flex recognize #line directives).

+ - The funky restrictions on when semi-colons could follow the

+ YY_NEW_FILE and yyless macros have been removed. They now

+ behave identically to functions.

+ - A bug in the sample redefinition of YY_INPUT in the documentation

+ has been corrected.

+ - A bug in the sample simple tokener in the documentation has

+ been corrected.

+ - The documentation on the incompatibilities between flex and

+ lex has been reordered so that the discussion of yylineno

+ and input() come first, as it's anticipated that these will

+ be the most common source of headaches.

+ Things which didn't used to be documented but now are:

+ - flex interprets "^foo|bar" differently from lex. flex interprets

+ it as "match either a 'foo' or a 'bar', providing it comes at the

+ beginning of a line", whereas lex interprets it as "match either

+ a 'foo' at the beginning of a line, or a 'bar' anywhere".

+ - flex initializes the global "yyin" on the first call to the

+ scanner, while lex initializes it at compile-time.

+ - yy_switch_to_buffer() can be used in the yywrap() macro/routine.

+ - flex scanners do not use stdio for their input, and hence when

+ writing an interactive scanner one must explicitly call fflush()

+ after writing out a prompt.

+ - flex scanners can be made reentrant (after a fashion) by using

+ "yyrestart( yyin );". This is useful for interactive scanners

+ which have interrupt handlers that long-jump out of the scanner.

+ - a defense of why yylineno is not supported is included, along

+ with a suggestion on how to convert scanners which rely on it.

+ Other changes:

+ - Prototypes and proper declarations of void routines have

+ been added to the flex source code, courtesy of Kevin B. Kenny.

+ - Routines dealing with memory allocation now use void* pointers

+ instead of char* - see Makefile for porting implications.

+ - Error-checking is now done when flex closes a file.

+ - Various lint tweaks were added to reduce the number of gripes.

+ - Makefile has been further parameterized to aid in porting.

+ - Support for SCO Unix added.

+ - Flex now sports the latest & greatest UC copyright notice

+ (which is only slightly different from the previous one).

+ - A note has been added to flexdoc.1 mentioning work in progress

+ on modifying flex to generate straight C code rather than a

+ table-driven automaton, with an email address of whom to contact

+ if you are working along similar lines.

+Changes between 2.2 Patch #3 (30Mar90) and 2.2 Patch #2:

+ - fixed bug which caused -I scanners to bomb

+Changes between 2.2 Patch #2 (27Mar90) and 2.2 Patch #1:

+ - fixed bug writing past end of input buffer in yyunput()

+ - fixed bug detecting NUL's at the end of a buffer

+Changes between 2.2 Patch #1 (23Mar90) and 2.2 (alpha) release:

+ - Makefile fixes: definition of MAKE variable for systems

+ which don't have it; installation of flexdoc.1 along with

+ flex.1; fixed two bugs which could cause "bigtest" to fail.

+ - flex.skel fix for compiling with g++.

+ - README and flexdoc.1 no longer list an out-of-date BITNET address

+ for contacting me.

+ - minor typos and formatting changes to flex.1 and flexdoc.1.

+Changes between 2.2 (alpha) release of March '90 and previous release:

+ User-visible:

+ - Full user documentation now available.

+ - Support for 8-bit scanners.

+ - Scanners now accept NUL's.

+ - A facility has been added for dealing with multiple

+ input buffers.

+ - Two manual entries now. One which fully describes flex

+ (rather than just its differences from lex), and the

+ other for quick(er) reference.

+ - A number of changes to bring flex closer into compliance

+ with the latest POSIX lex draft:

+ %t support

+ flex now accepts multiple input files and concatenates

+ them together to form its input

+ previous -c (compress) flag renamed -C

+ do-nothing -c and -n flags added

+ Any indented code or code within %{}'s in section 2 is

+ now copied to the output

+ - yyleng is now a bona fide global integer.

+ - -d debug information now gives the line number of the

+ matched rule instead of which number rule it was from

+ the beginning of the file.

+ - -v output now includes a summary of the flags used to generate

+ the scanner.

+ - unput() and yyrestart() are now globally callable.

+ - yyrestart() no longer closes the previous value of yyin.

+ - C++ support; generated scanners can be compiled with C++ compiler.

+ - Primitive -lfl library added, containing default main()

+ which calls yylex(). A number of routines currently living

+ in the scanner skeleton will probably migrate to here

+ in the future (in particular, yywrap() will probably cease

+ to be a macro and instead be a function in the -lfl library).

+ - Hexadecimal (\x) escape sequences added.

+ - Support for MS-DOS, VMS, and Turbo-C integrated.

+ - The %used/%unused operators have been deprecated. They

+ may go away soon.

+ Other changes:

+ - Makefile enhanced for easier testing and installation.

+ - The parser has been tweaked to detect some erroneous

+ constructions which previously were missed.

+ - Scanner input buffer overflow is now detected.

+ - Bugs with missing "const" declarations fixed.

+ - Out-of-date Minix/Atari patches provided.

+ - Scanners no longer require printf() unless FLEX_DEBUG is being used.

+ - A subtle input() bug has been fixed.

+ - Line numbers for "continued action" rules (those following

+ the special '|' action) are now correct.

+ - unput() bug fixed; had been causing problems porting flex to VMS.

+ - yymore() handling rewritten to fix bug with interaction

+ between yymore() and trailing context.

+ - EOF in actions now generates an error message.

+ - Bug involving -CFe and generating equivalence classes fixed.

+ - Bug which made -CF be treated as -Cf fixed.

+ - Support for SysV tmpnam() added.

+ - Unused #define's for scanner no longer generated.

+ - Error messages which are associated with a particular input

+ line are now all identified with their input line in standard

+ format.

+ - % directives which are valid to lex but not to flex are

+ now ignored instead of generating warnings.

+ - -DSYS_V flag can now also be specified -DUSG for System V

+ compilation.

+Changes between 2.1 beta-test release of June '89 and previous release:

+ User-visible:

+ - -p flag generates a performance report to stderr. The report

+ consists of comments regarding features of the scanner rules

+ which result in slower scanners.

+ - -b flag generates backtracking information to lex.backtrack.

+ This is a list of scanner states which require backtracking

+ and the characters on which they do so. By adding rules

+ one can remove backtracking states. If all backtracking states

+ are eliminated, the generated scanner will run faster.

+ Backtracking is not yet documented in the manual entry.

+ - Variable trailing context now works, i.e., one can have

+ rules like "(foo)*/[ \t]*bletch". Some trailing context

+ patterns still cannot be properly matched and generate

+ error messages. These are patterns where the ending of the

+ first part of the rule matches the beginning of the second

+ part, such as "zx*/xy*", where the 'x*' matches the 'x' at

+ the beginning of the trailing context. Lex won't get these

+ patterns right either.

+ - Faster scanners.

+ - End-of-file rules. The special rule "<<EOF>>" indicates

+ actions which are to be taken when an end-of-file is

+ encountered and yywrap() returns non-zero (i.e., indicates

+ no further files to process). See manual entry for example.

+ - The -r (reject used) flag is gone. flex now scans the input

+ for occurrences of the string "REJECT" to determine if the

+ action is needed. It tries to be intelligent about this but

+ can be fooled. One can force the presence or absence of

+ REJECT by adding a line in the first section of the form

+ "%used REJECT" or "%unused REJECT".

+ - yymore() has been implemented. Similarly to REJECT, flex

+ detects the use of yymore(), which can be overridden using

+ "%used" or "%unused".

+ - Patterns like "x{0,3}" now work (i.e., with lower-limit == 0).

+ - Removed '\^x' for ctrl-x misfeature.

+ - Added '\a' and '\v' escape sequences.

+ - \<digits> now works for octal escape sequences; previously

+ \0<digits> was required.

+ - Better error reporting; line numbers are associated with rules.

+ - yyleng is a macro; it cannot be accessed outside of the

+ scanner source file.

+ - yytext and yyleng should not be modified within a flex action.

+ - Generated scanners #define the name FLEX_SCANNER.

+ - Rules are internally separated by YY_BREAK in lex.yy.c rather

+ than break, to allow redefinition.

+ - The macro YY_USER_ACTION can be redefined to provide an action

+ which is always executed prior to the matched rule's action.

+ - yyrestart() is a new action which can be used to restart

+ the scanner after it has seen an end-of-file (a "real" one,

+ that is, one for which yywrap() returned non-zero). It takes

+ a FILE* argument indicating a new file to scan and sets

+ things up so that a subsequent call to yylex() will start

+ scanning that file.

+ - Internal scanner names are now all preceded by "yy_".

+ - lex.yy.c is deleted if errors are encountered during processing.

+ - Comments may be put in the first section of the input by preceding

+ them with '#'.

+ Other changes:

+ - Some portability-related bugs fixed, in particular for machines

+ with unsigned characters or sizeof( int* ) != sizeof( int ).

+ Also, tweaks for VMS and Microsoft C (MS-DOS), and identifiers all

+ trimmed to be 31 or fewer characters. Shortened file names

+ for dinosaur OS's. Checks for allocating > 64K memory

+ on 16 bit'ers. Amiga tweaks. Compiles using gcc on a Sun-3.

+ - Compressed and fast scanner skeletons merged.

+ - Skeleton header files done away with.

+ - Generated scanner uses prototypes and "const" for __STDC__.

+ - -DSV flag is now -DSYS_V for System V compilation.

+ - Removed all references to FTL language.

+ - Software now covered by BSD Copyright.

+ - flex will replace lex in subsequent BSD releases.

diff --git a/usr.bin/lex/README b/usr.bin/lex/README
new file mode 100644
index 000000000000..339e9bbbd51e
--- /dev/null
+++ b/usr.bin/lex/README

@@ -0,0 +1,67 @@

+This is release 2.4 of flex. See "version.h" for the exact patch-level.

+See the file "NEWS" to find out what is new in this Flex release.

+Read the file "INSTALL" for general installation directives. Peek near

+the beginning of the file "Makefile.in" for special DEFS values. On most

+systems, you can just run the "configure" script and type "make" to build

+flex; then "make check" to test whether it built correctly; and if it did,

+then "make install" to install it.

+If you're feeling adventurous, you can also issue "make bigcheck" (be

+prepared to wait a while).

+Note that flex is distributed under a copyright very similar to that of

+BSD Unix, and not under the GNU General Public License (GPL), except for

+the "configure" script, which is covered by the GPL.

+Many thanks to the 2.4 pre-testers for finding a bunch of bugs and helping

+increase/test portability: Francois Pinard, Nathan Zelle, Gavin Nicol,

+Chris Thewalt, and Matthew Jacob.

+Please send bug reports and feedback to:

+ Vern Paxson

+ ICSD, 46A/1123

+ Lawrence Berkeley Laboratory

+ 1 Cyclotron Rd.

+ Berkeley, CA 94720

+ vern@ee.lbl.gov

+The flex distribution consists of the following files:

+ README This message

+ NEWS Differences between the various releases

+ INSTALL General installation information

+ COPYING flex's copyright

+ configure.in, configure, Makefile.in, install.sh, mkinstalldirs

+ elements of the "autoconf" auto-configuration process

+ flexdef.h, parse.y, scan.l, ccl.c, dfa.c, ecs.c, gen.c, main.c,

+ misc.c, nfa.c, sym.c, tblcmp.c, yylex.c

+ source files

+ version.h version of this flex release

+ flex.skl flex scanner skeleton

+ mkskel.sh script for converting flex.skl to C source file skel.c

+ liballoc.c

+ libmain.c flex library (-lfl) sources

+ libyywrap.c

+ initscan.c pre-flex'd version of scan.l

+ FlexLexer.h header file for C++ lexer class

+ flexdoc.1 full user documentation

+ flex.1 reference documentation

+ MISC/ a directory containing miscellaneous contributions.

+ See MISC/README for details.

diff --git a/usr.bin/lex/ccl.c b/usr.bin/lex/ccl.c
new file mode 100644
index 000000000000..fe28463923e0
--- /dev/null
+++ b/usr.bin/lex/ccl.c

@@ -0,0 +1,149 @@

+/* ccl - routines for character classes */

+/*-

+ *

+ * This code is derived from software contributed to Berkeley by

+ * Vern Paxson.

+ *

+ * The United States Government has rights in this work pursuant

+ * to contract no. DE-AC03-76SF00098 between the United States

+ * Department of Energy and the University of California.

+ *

+ * Redistribution and use in source and binary forms are permitted provided

+ * that: (1) source distributions retain this entire copyright notice and

+ * comment, and (2) distributions including binaries display the following

+ * acknowledgement: ``This product includes software developed by the

+ * University of California, Berkeley and its contributors'' in the

+ * documentation or other materials provided with the distribution and in

+ * all advertising materials mentioning features or use of this software.

+ * Neither the name of the University nor the names of its contributors may

+ * be used to endorse or promote products derived from this software without

+ * specific prior written permission.

+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED

+ * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF

+ * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.

+ */

+/* $Header: /home/daffy/u0/vern/flex/RCS/ccl.c,v 2.9 93/09/16 20:32:14 vern Exp $ */

+#include "flexdef.h"

+/* ccladd - add a single character to a ccl
+ *
+ * cclp is the index of the ccl to extend and ch is the character to add.
+ * Nothing is changed if ch is already a member.  Otherwise ch is stored
+ * in ccltbl just past the ccl's current last member (the table is
+ * enlarged first if that slot lies at or beyond its current size) and
+ * the ccl's length is incremented.
+ */
+void ccladd( cclp, ch )
+int cclp;
+int ch;
+	{
+	int first, count, slot, k;
+
+	check_char( ch );
+
+	first = cclmap[cclp];
+	count = ccllen[cclp];
+
+	/* a character that is already a member is not added a second time */
+	k = 0;
+	while ( k < count )
+		{
+		if ( ccltbl[first + k] == ch )
+			return;
+		++k;
+		}
+
+	slot = first + count;
+
+	if ( slot >= current_max_ccl_tbl_size )
+		{
+		/* the new slot does not fit; enlarge the table */
+		++num_reallocs;
+		current_max_ccl_tbl_size += MAX_CCL_TBL_SIZE_INCREMENT;
+
+		ccltbl = reallocate_Character_array( ccltbl,
+						current_max_ccl_tbl_size );
+		}
+
+	ccltbl[slot] = ch;
+	ccllen[cclp] = count + 1;
+	}

+/* cclinit - return an empty ccl
+ *
+ * Advances lastccl to a new ccl index, enlarging the cclmap, ccllen and
+ * cclng arrays when that index reaches current_maxccls.  The new ccl is
+ * given zero length and marked un-negated, and its index is returned.
+ */
+int cclinit()
+	{
+	int newccl = ++lastccl;
+
+	if ( newccl >= current_maxccls )
+		{
+		++num_reallocs;
+		current_maxccls += MAX_CCLS_INCREMENT;
+
+		cclmap = reallocate_integer_array( cclmap, current_maxccls );
+		ccllen = reallocate_integer_array( ccllen, current_maxccls );
+		cclng = reallocate_integer_array( cclng, current_maxccls );
+		}
+
+	/* The first ccl starts at offset 0.  Every later ccl starts just
+	 * past the end of its predecessor: since cclmap holds the position
+	 * of a ccl's \first/ character, adding the predecessor's length to
+	 * its cclmap entry gives the first free position.
+	 */
+	cclmap[newccl] = ( newccl == 1 ) ? 0 :
+			cclmap[newccl - 1] + ccllen[newccl - 1];
+
+	cclng[newccl] = 0;	/* ccl's start out life un-negated */
+	ccllen[newccl] = 0;
+
+	return newccl;
+	}

+/* cclnegate - negate the given ccl
+ *
+ * cclp is the index of the ccl to mark.  Only the ccl's entry in cclng
+ * is changed (set to 1); nothing else is modified here.
+ */

+void cclnegate( cclp )

+int cclp;

+ {

+ cclng[cclp] = 1; /* flag this ccl as negated */

+ }

+/* list_character_set - list the members of a set of characters in CCL form
+ *
+ * Writes to the given file a character-class representation of those
+ * characters present in the given set.  A character is present if it
+ * has a non-zero value in the cset array, which is examined for indices
+ * 0 up to (but not including) csize.
+ *
+ * The output is bracketed by '[' and ']'.  Each maximal run of consecutive
+ * members is written as " first-last ", or as just " first " when the run
+ * is a single character; readable_form() supplies the text for each
+ * character.
+ */
+void list_character_set( file, cset )
+FILE *file;
+int cset[];
+	{
+	register int i;
+
+	putc( '[', file );
+
+	for ( i = 0; i < csize; ++i )
+		{
+		if ( cset[i] )
+			{
+			register int start_char = i;
+
+			putc( ' ', file );
+
+			fputs( readable_form( i ), file );
+
+			/* advance i to the first non-member past this run */
+			while ( ++i < csize && cset[i] )
+				;
+
+			if ( i - 1 > start_char )
+				/* this was a run */
+				fprintf( file, "-%s", readable_form( i - 1 ) );
+
+			putc( ' ', file );
+			}
+		}
+
+	/* the closing bracket is written once, after the whole set */
+	putc( ']', file );
+	}

diff --git a/usr.bin/lex/dfa.c b/usr.bin/lex/dfa.c
new file mode 100644
index 000000000000..f8fceb975acd
--- /dev/null
+++ b/usr.bin/lex/dfa.c

@@ -0,0 +1,1085 @@

+/* dfa - DFA construction routines */