📄 sfvscanf.c
字号:
/* Copyright (c) Colorado School of Mines, 2006.*/
/* All rights reserved.                       */
#include	"sfhdr.h"

/*	The main engine for reading formatted data
**
**	Written by Kiem-Phong Vo.
*/

#define MAXWIDTH	(int)(((uint)~0)>>1)	/* max amount to scan	*/

/*
 * pull in a private strtold()
 */

#include "sfstrtof.h"

/* Refresh the stream buffer - taking care of unseekable/share streams too.
**
** Nothing is done while unread data remains (f->next < f->endb).
** Otherwise, when *peek is non-zero, SF_RV is set and a fill is attempted;
** if that fill yields data, SF_PEEK is set and the function returns.
** If it does not, *peek is cleared and an ordinary fill is done.
*/
#if __STD_C
static void _sfbuf(Sfio_t* f, int* peek)
#else
static void _sfbuf(f, peek)
Sfio_t*	f;
int*	peek;
#endif
{
	if(f->next < f->endb)	/* still have buffered data */
		return;

	if(*peek) 	/* try peeking for a share stream if possible */
	{	f->mode |= SF_RV;
		if(SFFILBUF(f,-1) > 0)
		{	f->mode |= SF_PEEK;
			return;
		}
		*peek = 0;	/* can't peek, back to normal reads */
	}

	(void)SFFILBUF(f,-1);
}

/* buffer used during scanning of a double value or a multi-byte
   character. the fields mirror certain local variables in sfvscanf.  */
typedef struct _scan_s
{	int	error;	/* get set by _sfdscan if no value specified	*/
	int	inp;	/* last input character read			*/
	int	width;	/* field width					*/
	Sfio_t	*f;	/* stream being scanned				*/
	uchar	*d, *endd, *data;	/* local buffering system	*/
	int	peek;	/* != 0 if unseekable/share stream		*/
	int	n_input;/* number of input bytes processed		*/
} Scan_t;

/* SCinit copies the caller's locals (f, width, d, endd, data, peek, n_input)
   into a Scan_t; SCend copies them back out. Both expand in the scope of
   the caller and rely on locals with exactly those names.
   ds != 0 for scanning double values */
#define SCinit(sc,ds)	((sc)->inp = (sc)->error = -1, (sc)->f = f, \
			 ((sc)->width = (ds) ? width : -1), \
			 (sc)->d = d, (sc)->endd = endd, (sc)->data = data, \
			 (sc)->peek = peek, (sc)->n_input = n_input)
#define SCend(sc,ds)	(inp = (sc)->inp, f = (sc)->f, \
			 (width = (ds) ? (sc)->width : width), \
			 d = (sc)->d, endd = (sc)->endd, data = (sc)->data, \
			 peek = (sc)->peek, n_input = (sc)->n_input)

/* Fetch the next input byte through a Scan_t handle.
**
** arg:  the Scan_t being read from (passed as void*).
** flag: if non-zero, it is recorded in sc->error and 0 is returned
**	 without reading anything.
**
** Returns the next byte, or 0 when the field width is exhausted
** (sc->width == 0) or no more data can be obtained; in both of those
** cases sc->inp is set to -1.
*/
#if __STD_C
static int _scgetc(void* arg, int flag)
#else
static int _scgetc(arg, flag)
void*	arg;
int	flag;
#endif
{
	Scan_t	*sc = (Scan_t*)arg;

	if (flag)
	{	sc->error = flag;
		return 0;
	}

	/* if width >= 0, do not allow to exceed width number of bytes */
	if(sc->width == 0)
	{	sc->inp = -1;
		return 0;
	}

	if(sc->d >= sc->endd) /* refresh local buffer */
	{	/* account for what was consumed from the local window */
		sc->n_input += sc->d - sc->data;
		if(sc->peek)
			SFREAD(sc->f, sc->data, sc->d - sc->data);
		else	sc->f->next = sc->d;

		_sfbuf(sc->f, &sc->peek);
		sc->data = sc->d = sc->f->next;
		sc->endd = sc->f->endb;

		if(sc->d >= sc->endd)	/* nothing more to read */
		{	sc->inp = -1;
			return 0;
		}
	}

	/* sc->inp is only updated while the decremented width is still >= 0 */
	if((sc->width -= 1) >= 0) /* from _sfdscan */
		return (sc->inp = (int)(*sc->d++));
	else	return ((int)(*sc->d++));
}

/* structure to match characters in a character class */
typedef struct _accept_s
{	/* one slot per byte value 0..SF_MAXCHAR inclusive; _sfsetclass
	   initialises and indexes the table with c <= SF_MAXCHAR, so the
	   array needs SF_MAXCHAR+1 elements */
	char	ok[SF_MAXCHAR+1];
	int	yes;		/* 1 for a plain set, 0 for a '^' set	*/
	char	*form, *endf;	/* class text after any special first
				   char, and its closing ']'		*/
#if _has_multibyte
	wchar_t	wc;
#endif
} Accept_t;

/* Parse a %[...] character class and fill in the accept table.
**
** form:  points just past the opening '['.
** ac:    receives the table (ok[]), the polarity (yes) and the
**	  bounds of the class text (form/endf).
** flags: SFFMT_LONG for wchar_t.
**
** Returns a pointer just past the closing ']', or NIL(char*) if the
** format string ends before the class is closed or a multi-byte
** character in it cannot be measured.
*/
#if __STD_C
static char* _sfsetclass(const char* form, Accept_t* ac, int flags)
#else
static char* _sfsetclass(form, ac, flags)
char*		form;	/* format string			*/
Accept_t*	ac;	/* values of accepted characters	*/
int		flags;	/* SFFMT_LONG for wchar_t		*/
#endif
{
	int		c, endc, n;
#if _has_multibyte
	SFMBDCL(mbs)
#endif

	if(*form == '^') /* complementing this set */
	{	ac->yes = 0;
		form += 1;
	}
	else	ac->yes = 1;

	for(c = 0; c <= SF_MAXCHAR; ++c)
		ac->ok[c] = !ac->yes;

	if(*form == ']' || *form == '-') /* special first char */
	{	ac->ok[*((uchar*)form)] = ac->yes;
		form += 1;
	}
	ac->form = (char*)form;

	if(flags&SFFMT_LONG)
		SFMBCLR(&mbs);
	for(n = 1; *form != ']'; form += n)
	{	if((c = *((uchar*)form)) == 0)
			return NIL(char*);

		if(*(form+1) == '-')
		{	endc = *((uchar*)(form+2));
			if(endc == 0)	/* "x-" then end of format: stepping
					   by 3 would run past the NUL */
				return NIL(char*);
#if _has_multibyte
			if(c >= 128 || endc >= 128 ) /* range must be ascii */
				goto one_char;
#endif
			for(; c <= endc; ++c)
				ac->ok[c] = ac->yes;
			n = 3;
		}
		else
		{ one_char:
			/* reset the step: it may still be 3 from a preceding
			   range, which would skip the following characters */
			n = 1;
#if _has_multibyte /* true multi-byte chars must be checked differently */
			if((flags&SFFMT_LONG) && (n = (int)SFMBLEN(form,&mbs)) <= 0)
				return NIL(char*);
			if(n == 1)
#endif
				ac->ok[c] = ac->yes;
		}
	}

	ac->endf = (char*)form;
	return (char*)(form+1);
}

#if _has_multibyte
/* Test a wide character against the multi-byte members of a class.
**
** Walks the class text recorded in ac->form, skipping ascii ranges,
** and converts each remaining element with mbrtowc(). Returns ac->yes
** if a multi-byte element equals wc, !ac->yes if the closing ']' is
** reached without a match, and 0 if the text ends early or holds a
** sequence that mbrtowc() cannot convert.
*/
#if __STD_C
static int _sfwaccept(wchar_t wc, Accept_t* ac)
#else
static int _sfwaccept(wc, ac)
wchar_t		wc;
Accept_t*	ac;
#endif
{
	int		endc, c, n;
	wchar_t		fwc;
	char		*form = ac->form;
	SFMBDCL(mbs)

	SFMBCLR(&mbs);
	for(n = 1; *form != ']'; form += n)
	{	if((c = *((uchar*)form)) == 0)
			return 0;

		if(*(form+1) == '-')
		{	endc = *((uchar*)(form+2));
			if(c >= 128 || endc >= 128 ) /* range must be ascii */
				goto one_char;
			n = 3;
		}
		else
		{ one_char:
			n = (int)mbrtowc(&fwc, form, ac->endf-form, &mbs);
			if(n <= 0)	/* conversion failed: a non-positive
					   step would move form backwards */
				return 0;
			if(n > 1 && wc == fwc)
				return ac->yes;
		}
	}

	return !ac->yes;
}

#if _has_multibyte == 1
#define SFgetwc(sc,wc,fmt,ac,mbs)	_sfgetwc(sc,wc,fmt,ac,(Void_t*)(mbs))
#else
#define SFgetwc(sc,wc,fmt,ac,mbs)	_sfgetwc(sc,wc,fmt,ac,NIL(Void_t*))
#endif

/* Read one (possibly multi-byte) character and test it against fmt.
**
** Returns 1 if a character was read and accepted for the given
** conversion ('c', 's', '[', or otherwise an exact match against
** ac->wc); returns 0 after backing the local read pointer up by the
** number of bytes consumed (limited to the start of the local buffer).
*/
#if __STD_C
static int _sfgetwc(Scan_t* sc, wchar_t* wc, int fmt, Accept_t* ac, Void_t *mbs)
#else
static int _sfgetwc(sc, wc, fmt, ac, mbs)
Scan_t*		sc;	/* the scanning handle		*/
wchar_t*	wc;	/* to return a scanned wchar_t	*/
int		fmt;	/* %s, %c, %[			*/
Accept_t*	ac;	/* accept handle for %[		*/
Void_t*		mbs;	/* multibyte parsing state	*/
#endif
{
	int	n, v;
	char	b[16]; /* assuming that SFMBMAX <= 16! */

	/* shift left data so that there will be more room to back up on error.
	   this won't help streams with small buffers - c'est la vie! */
	if(sc->d > sc->f->data && (n = sc->endd - sc->d) > 0 && n < SFMBMAX)
	{	/* source and destination lie in the same buffer and may
		   overlap, so memmove rather than memcpy */
		memmove(sc->f->data, sc->d, n);
		if(sc->f->endr == sc->f->endb)
			sc->f->endr = sc->f->data+n;
		if(sc->f->endw == sc->f->endb)
			sc->f->endw = sc->f->data+n;
		sc->f->endb = sc->f->data+n;
		sc->d = sc->data = sc->f->data;
		sc->endd = sc->f->endb;
		if(!mbs) sc->f->endb = sc->endd; /* stop cc's "unused mbs" warning */
	}

	for(n = 0; n < SFMBMAX; )
	{	if((v = _scgetc((Void_t*)sc, 0)) <= 0)
			goto no_match;
		else	b[n++] = (char)v;

		/* NOTE(review): mbrtowc() may also return (size_t)(-2) for an
		   incomplete sequence; only (size_t)(-1) is rejected here, so
		   that case falls into the branch below - confirm intent. */
		if(mbrtowc(wc, b, n, (mbstate_t*)mbs) == (size_t)(-1))
			goto no_match;  /* malformed multi-byte char */
		else
		{	/* multi-byte char converted successfully */
			if(fmt == 'c')
				return 1;
			else if(fmt == 's')
			{	/* go through uchar: plain char may be signed */
				if(n > 1 || (n == 1 && !isspace((uchar)b[0]) ) )
					return 1;
				else	goto no_match;
			}
			else if(fmt == '[')
			{	/* index the table by byte value, never by a
				   negative char */
				if((n == 1 && ac->ok[(uchar)b[0]]) ||
				   (n  > 1 && _sfwaccept(*wc,ac)) )
					return 1;
				else	goto no_match;
			}
			else /* if(fmt == '1') match a single wchar_t */
			{	if(*wc == ac->wc)
					return 1;
				else	goto no_match;
			}
		}
	}

no_match: /* this unget is lossy on a stream with small buffer */
	if((sc->d -= n) < sc->data)
		sc->d = sc->data;
	return 0;
}
#endif /*_has_multibyte*/

/* sfvscanf: only the opening of this function (its declarations and the
   local buffering macros) falls on these lines; the remainder of the body
   follows unchanged. */
#if __STD_C
int sfvscanf(Sfio_t* f, reg const char* form, va_list args)
#else
int sfvscanf(f,form,args)
Sfio_t*		f;	/* file to be scanned */
reg char*	form;	/* scanning format */
va_list		args;
#endif
{
	reg int		inp, shift, base, width;
	ssize_t		size;
	int		fmt, flags, dot, n_assign, v, n, n_input;
	char		*sp;

	Accept_t	acc;

	Argv_t		argv;
	Sffmt_t		*ft;
	Fmt_t		*fm, *fmstk;

	Fmtpos_t*	fp;
	char		*oform;
	va_list		oargs;
	int		argp, argn;

	int		decimal = 0, thousand = 0;

#if _has_multibyte
	wchar_t		wc;
	SFMBDCL(fmbs)
	SFMBDCL(mbs)
#endif

	Void_t*		value;	/* location to assign scanned value */
	char*		t_str;
	ssize_t		n_str;

	/* local buffering system */
	Scan_t		scd;
	uchar		*d, *endd, *data;
	int		peek;
#define SFbuf(f)	(_sfbuf(f,&peek), (data = d = f->next), (endd = f->endb) )
#define SFlen(f)	(d - data)
#define SFinit(f)	((peek = f->extent < 0 && (f->flags&SF_SHARE)), SFbuf(f) )
#define SFend(f)	((n_input += \
SFlen(f)), \ (peek ? SFREAD(f,(Void_t*)data,SFlen(f)) : ((f->next = d),0)) )#define SFgetc(f,c) ((c) = (d < endd || (SFend(f), SFbuf(f), d < endd)) ? \ (int)(*d++) : -1 )#define SFungetc(f,c) (d -= 1) SFCVINIT(); /* initialize conversion tables */ SFMTXSTART(f,-1); if(!form || f->mode != SF_READ && _sfmode(f,SF_READ,0) < 0) SFMTXRETURN(f, -1); SFLOCK(f,0); SFinit(f); /* initialize local buffering system */ n_assign = n_input = 0; inp = -1; fmstk = NIL(Fmt_t*); ft = NIL(Sffmt_t*); fp = NIL(Fmtpos_t*); argn = -1; oform = (char*)form; va_copy(oargs,args); SFSETLOCALE(&decimal, &thousand);loop_fmt: SFMBCLR(&fmbs); while((fmt = *form++)) { if(fmt != '%') { if(isspace(fmt)) { if(fmt != '\n' || !(f->flags&SF_LINE)) fmt = -1; for(;;) { if(SFgetc(f,inp) < 0 || inp == fmt) goto loop_fmt; else if(!isspace(inp)) { SFungetc(f,inp); goto loop_fmt; } } } else { match_1:#if _has_multibyte if((n = (int)mbrtowc(&wc,form-1,SFMBMAX,&fmbs)) <= 0) goto pop_fmt; if(n > 1) { acc.wc = wc; SCinit(&scd,0); SFMBCLR(&mbs); v = SFgetwc(&scd, &wc, '1', &acc, &mbs); SCend(&scd,0); if(v == 0) goto pop_fmt; form += n-1; } else#endif if(SFgetc(f,inp) != fmt) { if(inp < 0) goto done; SFungetc(f,inp); goto pop_fmt; } } continue; } if(*form == '%') { form += 1; goto match_1; } if(*form == '\0') goto pop_fmt; if(*form == '*') { flags = SFFMT_SKIP; form += 1; } else flags = 0; /* matching some pattern */ base = 10; size = -1; width = dot = 0; t_str = NIL(char*); n_str = 0; value = NIL(Void_t*); argp = -1; loop_flags: /* LOOP FOR FLAGS, WIDTH, BASE, TYPE */ switch((fmt = *form++) ) { case LEFTP : /* get the type which is enclosed in balanced () */ t_str = (char*)form; for(v = 1;;) { switch(*form++) { case 0 : /* not balanceable, retract */ form = t_str; t_str = NIL(char*); n_str = 0; goto loop_flags; case LEFTP : /* increasing nested level */ v += 1; continue; case RIGHTP : /* decreasing nested level */ if((v -= 1) != 0) continue; if(*t_str != '*' ) n_str = (form-1) - t_str; else { t_str = 
(*_Sffmtintf)(t_str+1,&n); if(*t_str == '$') { if(!fp && !(fp = (*_Sffmtposf) (f,oform,oargs,ft,1)) ) goto pop_fmt; n = FP_SET(n,argn); } else n = FP_SET(-1,argn); if(fp) { t_str = fp[n].argv.s; n_str = fp[n].ft.size; } else if(ft && ft->extf ) { FMTSET(ft, form,args, LEFTP, 0, 0, 0,0,0, NIL(char*),0); n = (*ft->extf) (f,(Void_t*)&argv,ft); if(n < 0) goto pop_fmt; if(!(ft->flags&SFFMT_VALUE) ) goto t_arg; if((t_str = argv.s) && (n_str = (int)ft->size) < 0) n_str = strlen(t_str); } else { t_arg: if((t_str = va_arg(args,char*)) ) n_str = strlen(t_str); } } goto loop_flags; } } case '#' : /* alternative format */ flags |= SFFMT_ALTER; goto loop_flags; case '.' : /* width & base */ dot += 1; if(isdigit(*form)) { fmt = *form++; goto dot_size; } else if(*form == '*') { form = (*_Sffmtintf)(form+1,&n); if(*form == '$') { form += 1; if(!fp && !(fp = (*_Sffmtposf)(f,oform,oargs,ft,1)) ) goto pop_fmt; n = FP_SET(n,argn); } else n = FP_SET(-1,argn); if(fp) v = fp[n].argv.i; else if(ft && ft->extf ) { FMTSET(ft, form,args, '.',dot, 0, 0,0,0, NIL(char*), 0); if((*ft->extf)(f, (Void_t*)(&argv), ft) < 0) goto pop_fmt; if(ft->flags&SFFMT_VALUE) v = argv.i; else v = (dot <= 2) ? va_arg(args,int) : 0; } else v = (dot <= 2) ? va_arg(args,int) : 0; if(v < 0) v = 0; goto dot_set; } else goto loop_flags; case '0' : case '1' : case '2' : case '3' : case '4' : case '5' : case '6' : case '7' : case '8' : case '9' : dot_size : for(v = fmt-'0'; isdigit(*form); ++form) v = v*10 + (*form - '0'); if(*form == '$') { form += 1; if(!fp && !(fp = (*_Sffmtposf)(f,oform,oargs,ft,1)) ) goto pop_fmt; argp = v-1; goto loop_flags; } dot_set : if(dot == 0 || dot == 1) width = v; else if(dot == 2) base = v; goto loop_flags; case 'I' : /* object size */ size = -1; flags = (flags & ~SFFMT_TYPES) | SFFMT_IFLAG; if(isdigit(*form))
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -