scan.c
来自「开放源码的编译器open watcom 1.6.0版的源代码」· C语言 代码 · 共 356 行
C
356 行
/****************************************************************************
*
* Open Watcom Project
*
* Portions Copyright (c) 1983-2002 Sybase, Inc. All Rights Reserved.
*
* ========================================================================
*
* This file contains Original Code and/or Modifications of Original
* Code as defined in and that are subject to the Sybase Open Watcom
* Public License version 1.0 (the 'License'). You may not use this file
* except in compliance with the License. BY USING THIS FILE YOU AGREE TO
* ALL TERMS AND CONDITIONS OF THE LICENSE. A copy of the License is
* provided with the Original Code and Modifications, and is also
* available at www.sybase.com/developer/opensource.
*
* The Original Code and all software distributed under the License are
* distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
* EXPRESS OR IMPLIED, AND SYBASE AND ALL CONTRIBUTORS HEREBY DISCLAIM
* ALL SUCH WARRANTIES, INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR
* NON-INFRINGEMENT. Please see the License for the specific language
* governing rights and limitations under the License.
*
* ========================================================================
*
* Description: WHEN YOU FIGURE OUT WHAT THIS FILE DOES, PLEASE
* DESCRIBE IT HERE!
*
****************************************************************************/
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <io.h>
#include "defgen.h"
#include "ytab.h"
#include "scan.h"
/*
T_NAME := [A-Z|a-z|_][A-Z|a-z|0-9|_]*
T_NUM := [0-9]*
T_LPAREN := (
T_RPAREN := )
T_LSQ_BRACKET := [
T_RSQ_BRACKET := ]
T_SEMICOLON := ;
T_STAR := *
T_COMMA := ,
T_POUND := #
T_SLASH := /
*/
#define BUF_SIZE 512
static int FileHdl;
static char Buffer[512];
static char *BufEnd;
static char *CurPos;
typedef struct {
char *str;
int tok;
} KeyWord;
static KeyWord ReservedWords[] = {
"__cdecl", T_CDECL,
"__export", T_EXPORT,
"__far", T_FAR,
"__fortran", T_FORTRAN,
"__huge", T_HUGE,
"__near", T_NEAR,
"__pascal", T_PASCAL,
"__syscall", T_SYSCALL,
"char", T_CHAR,
"const", T_CONST,
"double", T_DOUBLE,
"extern", T_EXTERN,
"float", T_FLOAT,
"int", T_INT,
"line", T_LINE,
"long", T_LONG,
"pascal", T_PASCAL,
"short", T_SHORT,
"signed", T_SIGNED,
"struct", T_STRUCT,
"union", T_UNION,
"unsigned", T_UNSIGNED,
"void", T_VOID
};
static int GetNextChar( void ) {
char ch;
int size;
if( CurPos == BufEnd ) {
size = read( FileHdl, Buffer, BUF_SIZE );
if( size == 0 || size == -1 ) {
return( EOF );
}
BufEnd = Buffer + size;
CurPos = Buffer;
}
ch = *CurPos;
CurPos++;
return( ch );
}
static void PutBackChar( void ) {
CurPos--;
}
int MyComp( const void *p1, const void *p2 ) {
KeyWord *ptr;
ptr = (KeyWord *)p2;
return( strcmp( p1, ptr->str ) );
}
static int CheckReservedWords( char *tokbuf ) {
KeyWord *match;
match = bsearch( tokbuf, ReservedWords,
sizeof( ReservedWords ) / sizeof( KeyWord ),
sizeof( KeyWord ), MyComp );
if( match == NULL ) {
return( T_NAME );
} else {
return( match->tok );
}
}
BOOL ScanInit( char *fname ) {
FileHdl = open( fname, O_RDONLY | O_TEXT );
BufEnd = Buffer;
CurPos = BufEnd;
if( FileHdl == -1 ) {
ReportError( "Unable to open '%s'", fname );
return( TRUE );
} else {
return( FALSE );
}
}
void ScanFini( void ) {
close( FileHdl );
}
typedef enum {
ST_START,
ST_NAME,
ST_NUM,
ST_FNAME,
ST_STRING,
ST_ERR
} ScanState;
int Scan( ScanValue *val ) {
ScanState state;
char ch;
unsigned len;
int ret;
char token[256]; // BEWARE-assume no token is more than
// 256 characters
state = ST_START;
len = 0;
for( ;; ) {
switch( state ) {
case ST_START:
ch = GetNextChar();
while( isspace( ch ) ) ch = GetNextChar();
switch( ch ) {
case '(':
return( T_LPAREN );
case ')':
return( T_RPAREN );
case '[':
return( T_LSQ_BRACKET );
case ']':
return( T_RSQ_BRACKET );
case ';':
return( T_SEMICOLON );
case '*':
return( T_STAR );
case ',':
return( T_COMMA );
case '#':
return( T_POUND );
case '/':
return( T_SLASH );
case '.':
return( T_PERIOD );
case EOF:
return( 0 );
case '"':
state = ST_STRING;
break;
case '\\':
state = ST_FNAME;
token[len] = ch;
len++;
break;
default:
if( ch == '_' || isalpha( ch ) ) {
state = ST_NAME;
token[len] = ch;
len++;
} else if( isdigit( ch ) ) {
state = ST_NUM;
token[len] = ch;
len++;
} else {
state = ST_ERR;
}
break;
}
break;
case ST_ERR:
ReportError( "Scanner Error" );
return( 0 );
break;
case ST_NAME:
ch = GetNextChar();
while( isalnum( ch ) || ch == '_' ) {
token[len] = ch;
len++;
ch = GetNextChar();
}
if( ch == '.' || ch == ':' || ch == '\\' ) {
state = ST_FNAME;
token[len] = ch;
len++;
} else {
token[len] = '\0';
PutBackChar();
ret = CheckReservedWords( token );
val->str = malloc( strlen( token ) + 1 );
strcpy( val->str, token );
return( ret );
}
break;
case ST_NUM:
ch = GetNextChar();
while( isdigit( ch ) ) {
token[len] = ch;
len++;
ch = GetNextChar();
}
if( isalnum( ch ) || ch == '_' || ch == '.' || ch == '\\' ) {
state = ST_FNAME;
token[len] = ch;
len++;
} else {
PutBackChar();
token[len] = '\0';
val->str = malloc( strlen( token ) + 1 );
strcpy( val->str, token );
return( T_NUM );
}
break;
case ST_FNAME:
ch = GetNextChar();
while( isalnum( ch ) || ch == '_' || ch == '.' || ch == '\\'
|| ch == ':' ) {
token[len] = ch;
len++;
ch = GetNextChar();
}
token[len] = '\0';
PutBackChar();
val->str = malloc( strlen( token ) + 1 );
strcpy( val->str, token );
return( T_FNAME );
break;
case ST_STRING:
ch = GetNextChar();
while( ch != '"' ) {
token[len] = ch;
len++;
ch = GetNextChar();
}
token[len] = '\0';
val->str = malloc( strlen( token ) + 1 );
strcpy( val->str, token );
return( T_STRING );
break;
}
}
}
#if(0)
int Scan( ScanValue *val ) {
int ch;
char tokbuf[256]; // BEWARE-assume no token is more than
// 256 characters
unsigned len;
int ret;
ch = GetNextChar();
while( isspace( ch ) ) ch = GetNextChar();
if( ch == '_' || isalpha( ch ) ) {
len = 0;
while( ch == '_' || isalnum( ch ) ) {
tokbuf[len] = (char)(ch & 0xFF);
len++;
ch = GetNextChar();
}
tokbuf[len] = '\0';
PutBackChar();
ret = CheckReservedWords( tokbuf );
val->str = malloc( strlen( tokbuf ) + 1 );
strcpy( val->str, tokbuf );
return( ret );
} else if( isdigit( ch ) ) {
while( isdigit( ch ) ) {
ch = GetNextChar();
}
PutBackChar();
return( T_NUM );
} else switch( ch ) {
case '(':
return( T_LPAREN );
case ')':
return( T_RPAREN );
case '[':
return( T_LSQ_BRACKET );
case ']':
return( T_RSQ_BRACKET );
case ';':
return( T_SEMICOLON );
case '*':
return( T_STAR );
case ',':
return( T_COMMA );
case '#':
return( T_POUND );
case '/':
return( T_SLASH );
case EOF:
return( 0 );
default:
//NYI - report an error
return( 0 );
break;
}
}
#endif
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?