⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 push.fb.c

📁 a little DFA compiler.
💻 C
字号:
/* Generated by re2c */#line 1 "push.fb.re"/* *  A push-model scanner example for re2c -f *  Written Mon Apr 11 2005 by mgix@mgix.com *  This file is in the public domain. * */// ----------------------------------------------------------------------#include <fcntl.h>#include <stdio.h>#include <stddef.h>#include <stdlib.h>#include <string.h>#if defined(WIN32)    typedef signed char     int8_t;    typedef signed short    int16_t;    typedef signed int      int32_t;    typedef unsigned char   uint8_t;    typedef unsigned short  uint16_t;    typedef unsigned int    uint32_t;#else    #include <stdint.h>    #include <unistd.h>    #ifndef O_BINARY        #define O_BINARY 0    #endif#endif// ----------------------------------------------------------------------#define TOKENS              \                            \    TOK(kEOF)               \    TOK(kEOL)               \    TOK(kUnknown)           \    TOK(kIdentifier)        \    TOK(kDecimalConstant)   \                            \    TOK(kEqual)             \    TOK(kLeftParen)         \    TOK(kRightParen)        \    TOK(kMinus)             \    TOK(kPlus)              \    TOK(kStar)              \    TOK(kSlash)             \                            \    TOK(kIf)                \    TOK(kFor)               \    TOK(kElse)              \    TOK(kGoto)              \    TOK(kBreak)             \    TOK(kWhile)             \    TOK(kReturn)            \// ----------------------------------------------------------------------static const char *tokenNames[] ={    #define TOK(x) #x,        TOKENS    #undef TOK};// ----------------------------------------------------------------------class PushScanner{public:    enum Token    {        #define TOK(x) x,            TOKENS        #undef TOK    };private:    bool        eof;    int32_t     state;    uint8_t     *limit;    uint8_t     *start;    uint8_t     *cursor;    uint8_t     *marker;    uint8_t     *buffer;    uint8_t     *bufferEnd;    uint8_t     yych;    uint32_t    yyaccept;public:    // ----------------------------------------------------------------------    PushScanner()    {        limit = 0;        start = 0;        state = -1;        cursor = 0;        marker = 0;        buffer = 0;        eof = false;        bufferEnd = 0;    }    // ----------------------------------------------------------------------    ~PushScanner()    {    }    // ----------------------------------------------------------------------    void send(        Token token    )    {        size_t tokenSize = cursor-start;        const char *tokenName = tokenNames[token];        printf(            "scanner is pushing out a token of type %d (%s)",            token,            tokenName        );        if(token==kEOF) putchar('\n');        else        {            size_t tokenNameSize = strlen(tokenNames[token]);            size_t padSize = 20-(20<tokenNameSize ? 20 : tokenNameSize);            for(size_t i=0; i<padSize; ++i) putchar(' ');            printf(" : ---->");            fwrite(                start,                tokenSize,                1,                stdout            );            printf("<----\n");        }    }    // ----------------------------------------------------------------------    uint32_t push(        const void  *input,        ssize_t     inputSize    )    {        printf(            "scanner is receiving a new data batch of length %d\n"            "scanner continues with saved state = %d\n",            inputSize,            state        );        /*         * Data source is signaling end of file when batch size         * is less than maxFill. This is slightly annoying because         * maxFill is a value that can only be known after re2c does         * its thing. Practically though, maxFill is never bigger than         * the longest keyword, so given our grammar, 32 is a safe bet.         */        uint8_t null[64];        const ssize_t maxFill = 32;        if(inputSize<maxFill)        {            eof = true;            input = null;            inputSize = sizeof(null);            memset(null, 0, sizeof(null));        }        /*         * When we get here, we have a partially         * consumed buffer which is in the following state:         *                                                                last valid char        last valid buffer spot         *                                                                v                      v         * +-------------------+-------------+---------------+-------------+----------------------+         * ^                   ^             ^               ^             ^                      ^         * buffer              start         marker          cursor        limit                  bufferEnd         *          * We need to stretch the buffer and concatenate the new chunk of input to it         *         */        size_t used = limit-buffer;        size_t needed = used+inputSize;        size_t allocated = bufferEnd-buffer;        if(allocated<needed)        {            size_t limitOffset = limit-buffer;            size_t startOffset = start-buffer;            size_t markerOffset = marker-buffer;            size_t cursorOffset = cursor-buffer;                buffer = (uint8_t*)realloc(buffer, needed);                bufferEnd = needed+buffer;            marker = markerOffset + buffer;            cursor = cursorOffset + buffer;            start = buffer + startOffset;            limit = limitOffset + buffer;        }        memcpy(limit, input, inputSize);        limit += inputSize;        // The scanner starts here        #define YYLIMIT         limit        #define YYCURSOR        cursor        #define YYMARKER        marker        #define YYCTYPE         uint8_t        #define SKIP(x)         { start = cursor; goto yy0; }        #define SEND(x)         { send(x); SKIP();          }        #define YYFILL(n)       { goto fill;                }        #define YYGETSTATE()    state        #define YYSETSTATE(x)   { state = (x);  }    start:        {	static const unsigned char yybm[] = {		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		192, 192, 192, 192, 192, 192, 192, 192, 		192, 192,   0,   0,   0,   0,   0,   0, 		  0, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128,   0,   0,   0,   0, 128, 		  0, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128, 128, 128, 128, 128, 128, 		128, 128, 128,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 		  0,   0,   0,   0,   0,   0,   0,   0, 	};#line 268 "<stdout>"	{		switch(YYGETSTATE()) {		default: goto yy0;		case 0: goto yyFillLabel0;		case 1: goto yyFillLabel1;		case 2: goto yyFillLabel2;		}yy0:		YYSETSTATE(0);		if((YYLIMIT - YYCURSOR) < 7) YYFILL(7);yyFillLabel0:		yych = *YYCURSOR;		if(yych <= '=') {			if(yych <= '(') {				if(yych <= 0x0A) {					if(yych <= 0x00) goto yy32;					if(yych <= 0x08) goto yy34;					if(yych <= 0x09) goto yy30;					goto yy28;				} else {					if(yych <= 0x1F) {						if(yych <= 0x0D) goto yy30;						goto yy34;					} else {						if(yych <= ' ') goto yy30;						if(yych <= '\'') goto yy34;						goto yy16;					}				}			} else {				if(yych <= '-') {					if(yych <= '*') {						if(yych <= ')') goto yy18;						goto yy24;					} else {						if(yych <= '+') goto yy22;						if(yych <= ',') goto yy34;						goto yy20;					}				} else {					if(yych <= '/') {						if(yych <= '.') goto yy34;						goto yy26;					} else {						if(yych <= '9') goto yy12;						if(yych <= '<') goto yy34;						goto yy14;					}				}			}		} else {			if(yych <= 'e') {				if(yych <= '_') {					if(yych <= '@') goto yy34;					if(yych <= 'Z') goto yy10;					if(yych <= '^') goto yy34;					goto yy10;				} else {					if(yych <= 'a') {						if(yych <= '`') goto yy34;						goto yy10;					} else {						if(yych <= 'b') goto yy7;						if(yych <= 'd') goto yy10;						goto yy5;					}				}			} else {				if(yych <= 'q') {					if(yych <= 'g') {						if(yych <= 'f') goto yy4;						goto yy6;					} else {						if(yych <= 'h') goto yy11;						if(yych >= 'j') goto yy10;					}				} else {					if(yych <= 'v') {						if(yych <= 'r') goto yy9;						goto yy10;					} else {						if(yych <= 'w') goto yy8;						if(yych <= 'z') goto yy10;						goto yy34;					}				}			}		}		++YYCURSOR;		if((yych = *YYCURSOR) == 'f') goto yy67;		goto yy39;yy3:#line 246 "push.fb.re"		{ SEND(kIdentifier);     }#line 364 "<stdout>"yy4:		yych = *++YYCURSOR;		if(yych == 'o') goto yy64;		goto yy39;yy5:		yych = *++YYCURSOR;		if(yych == 'l') goto yy60;		goto yy39;yy6:		yych = *++YYCURSOR;		if(yych == 'o') goto yy56;		goto yy39;yy7:		yych = *++YYCURSOR;		if(yych == 'r') goto yy51;		goto yy39;yy8:		yych = *++YYCURSOR;		if(yych == 'h') goto yy46;		goto yy39;yy9:		yych = *++YYCURSOR;		if(yych == 'e') goto yy40;		goto yy39;yy10:		yych = *++YYCURSOR;		goto yy39;yy11:		yych = *++YYCURSOR;		goto yy39;yy12:		++YYCURSOR;		yych = *YYCURSOR;		goto yy37;yy13:#line 247 "push.fb.re"		{ SEND(kDecimalConstant);}#line 402 "<stdout>"yy14:		++YYCURSOR;#line 249 "push.fb.re"		{ SEND(kEqual);          }#line 407 "<stdout>"yy16:		++YYCURSOR;#line 250 "push.fb.re"		{ SEND(kLeftParen);      }#line 412 "<stdout>"yy18:		++YYCURSOR;#line 251 "push.fb.re"		{ SEND(kRightParen);     }#line 417 "<stdout>"yy20:		++YYCURSOR;#line 252 "push.fb.re"		{ SEND(kMinus);          }#line 422 "<stdout>"yy22:		++YYCURSOR;#line 253 "push.fb.re"		{ SEND(kPlus);           }#line 427 "<stdout>"yy24:		++YYCURSOR;#line 254 "push.fb.re"		{ SEND(kStar);           }#line 432 "<stdout>"yy26:		++YYCURSOR;#line 255 "push.fb.re"		{ SEND(kSlash);          }#line 437 "<stdout>"yy28:		++YYCURSOR;#line 257 "push.fb.re"		{ SKIP();                }#line 442 "<stdout>"yy30:		++YYCURSOR;#line 258 "push.fb.re"		{ SKIP();                }#line 447 "<stdout>"yy32:		++YYCURSOR;#line 259 "push.fb.re"		{ send(kEOF); return 1;  }#line 452 "<stdout>"yy34:		++YYCURSOR;#line 260 "push.fb.re"		{ SEND(kUnknown);        }#line 457 "<stdout>"yy36:		++YYCURSOR;		YYSETSTATE(1);		if(YYLIMIT == YYCURSOR) YYFILL(1);yyFillLabel1:		yych = *YYCURSOR;yy37:		if(yybm[0+yych] & 64) {			goto yy36;		}		goto yy13;yy38:		++YYCURSOR;		YYSETSTATE(2);		if(YYLIMIT == YYCURSOR) YYFILL(1);yyFillLabel2:		yych = *YYCURSOR;yy39:		if(yybm[0+yych] & 128) {			goto yy38;		}		goto yy3;yy40:		yych = *++YYCURSOR;		if(yych != 't') goto yy39;		yych = *++YYCURSOR;		if(yych != 'u') goto yy39;		yych = *++YYCURSOR;		if(yych != 'r') goto yy39;		yych = *++YYCURSOR;		if(yych != 'n') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 245 "push.fb.re"		{ SEND(kReturn);         }#line 495 "<stdout>"yy46:		yych = *++YYCURSOR;		if(yych != 'i') goto yy39;		yych = *++YYCURSOR;		if(yych != 'l') goto yy39;		yych = *++YYCURSOR;		if(yych != 'e') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 244 "push.fb.re"		{ SEND(kWhile);          }#line 509 "<stdout>"yy51:		yych = *++YYCURSOR;		if(yych != 'e') goto yy39;		yych = *++YYCURSOR;		if(yych != 'a') goto yy39;		yych = *++YYCURSOR;		if(yych != 'k') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 243 "push.fb.re"		{ SEND(kBreak);          }#line 523 "<stdout>"yy56:		yych = *++YYCURSOR;		if(yych != 't') goto yy39;		yych = *++YYCURSOR;		if(yych != 'o') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 242 "push.fb.re"		{ SEND(kGoto);           }#line 535 "<stdout>"yy60:		yych = *++YYCURSOR;		if(yych != 's') goto yy39;		yych = *++YYCURSOR;		if(yych != 'e') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 241 "push.fb.re"		{ SEND(kElse);           }#line 547 "<stdout>"yy64:		yych = *++YYCURSOR;		if(yych != 'r') goto yy39;		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 240 "push.fb.re"		{ SEND(kFor);            }#line 557 "<stdout>"yy67:		++YYCURSOR;		if(yybm[0+(yych = *YYCURSOR)] & 128) {			goto yy38;		}#line 239 "push.fb.re"		{ SEND(kIf);             }#line 565 "<stdout>"	}}#line 261 "push.fb.re"    fill:        ssize_t unfinishedSize = cursor-start;        printf(            "scanner needs a refill. Exiting for now with:\n"            "    saved fill state = %d\n"            "    unfinished token size = %d\n",            state,            unfinishedSize        );        if(0<unfinishedSize && start<limit)        {            printf("    unfinished token is :");            fwrite(start, 1, cursor-start, stdout);            putchar('\n');        }        putchar('\n');        /*         * Once we get here, we can get rid of         * everything before start and after limit.         */        if(eof==true) goto start;        if(buffer<start)        {            size_t startOffset = start-buffer;            memmove(buffer, start, limit-start);            marker -= startOffset;            cursor -= startOffset;            limit -= startOffset;            start -= startOffset;        }        return 0;    }};// ----------------------------------------------------------------------int main(    int     argc,    char    **argv){    // Parse cmd line    int input = 0;    if(1<argc)    {        input = open(argv[1], O_RDONLY | O_BINARY);        if(input<0)        {            fprintf(                stderr,                "could not open file %s\n",                argv[1]            );            exit(1);        }    }    /*     * Tokenize input file by pushing batches     * of data one by one into the scanner.     */    const size_t batchSize = 256;    uint8_t buffer[batchSize];    PushScanner scanner;    while(1)    {        ssize_t n = read(input, buffer, batchSize);        scanner.push(buffer, n);        if(n<batchSize) break;    }    scanner.push(0, -1);    close(input);    // Done    return 0;}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -