dfa.cpp

来自「开放源码的编译器open watcom 1.6.0版的源代码」· C++ 代码 · 共 256 行

CPP
256
字号
/****************************************************************************
*
*                            Open Watcom Project
*
*    Portions Copyright (c) 1983-2002 Sybase, Inc. All Rights Reserved.
*
*  ========================================================================
*
*    This file contains Original Code and/or Modifications of Original
*    Code as defined in and that are subject to the Sybase Open Watcom
*    Public License version 1.0 (the 'License'). You may not use this file
*    except in compliance with the License. BY USING THIS FILE YOU AGREE TO
*    ALL TERMS AND CONDITIONS OF THE LICENSE. A copy of the License is
*    provided with the Original Code and Modifications, and is also
*    available at www.sybase.com/developer/opensource.
*
*    The Original Code and all software distributed under the License are
*    distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
*    EXPRESS OR IMPLIED, AND SYBASE AND ALL CONTRIBUTORS HEREBY DISCLAIM
*    ALL SUCH WARRANTIES, INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF
*    MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR
*    NON-INFRINGEMENT. Please see the License for the specific language
*    governing rights and limitations under the License.
*
*  ========================================================================
*
* Description:  WHEN YOU FIGURE OUT WHAT THIS FILE DOES, PLEASE
*               DESCRIBE IT HERE!
*
****************************************************************************/


#include <stdlib.h>
#include <ctype.h>
#include <string.h>
#include "globals.h"
#include "substr.h"
#include "dfa.h"

inline char octCh(uint c){
    return '0' + (char)c%8;
}

void prtCh(ostream &o, uchar c){
    uchar oc = talx[c];
    switch(oc){
    case '\'': o << "\\'"; break;
    case '\n': o << "\\n"; break;
    case '\t': o << "\\t"; break;
    case '\v': o << "\\v"; break;
    case '\b': o << "\\b"; break;
    case '\r': o << "\\r"; break;
    case '\f': o << "\\f"; break;
    case '\a': o << "\\a"; break;
    case '\\': o << "\\\\"; break;
    default:
    if(isprint(oc))
        o << (char) oc;
    else
        o << '\\' << octCh(c/64) << octCh(c/8) << octCh(c);
    }
}

void printSpan(ostream &o, uint lb, uint ub){
    if(lb > ub)
    o << "*";
    o << "[";
    if((ub - lb) == 1){
    prtCh(o, (uchar)lb);
    } else {
    prtCh(o, (uchar)lb);
    o << "-";
    prtCh(o, (uchar)ub-1);
    }
    o << "]";
}

uint Span::show(ostream &o, uint lb){
    if(to){
    printSpan(o, lb, ub);
    o << " " << to->label << "; ";
    }
    return ub;
}

ostream& operator<<(ostream &o, const State &s){
    o << "state " << s.label;
    if(s.rule)
    o << " accepts " << s.rule->accept;
    o << "\n";
    uint lb = 0;
    for(uint i = 0; i < s.go.nSpans; ++i)
    lb = s.go.span[i].show(o, lb);
    return o;
}

ostream& operator<<(ostream &o, const DFA &dfa){
    for(State *s = dfa.head; s; s = s->next)
    o << s << "\n\n";
    return o;
}

State::State() : rule(NULL), action(NULL), link(NULL), kCount(0), kernel(NULL) {
    go.nSpans = 0;
    go.span = NULL;
}

State::~State(){
    delete [] kernel;
    delete [] go.span;
}

static Ins **closure(Ins **cP, Ins *i){
    while(!isMarked(i)){
    mark(i);
    *(cP++) = i;
    if(i->i.tag == FORK){
        cP = closure(cP, i + 1);
        i = (Ins*) i->i.link;
    } else if(i->i.tag == GOTO){
        i = (Ins*) i->i.link;
    } else
        break;
    }
    return cP;
}

struct GoTo {
    Char    ch;
    void    *to;
};

DFA::DFA(Ins *ins, uint ni, uint lb, uint ub, Char *rep)
    : lbChar(lb), ubChar(ub) {
    Ins **work = new Ins*[ni+1];
    uint nc = ub - lb;
    GoTo *goTo = new GoTo[nc];
    Span *span = new Span[nc];
    memset((char*) goTo, 0, nc*sizeof(GoTo));
    tail = &head;
    head = NULL;
    nStates = 0;
    toDo = NULL;
    findState(work, closure(work, &ins[0]) - work);
    while(toDo){
    State *s = toDo;
    toDo = s->link;

    Ins **cP, **iP;
    Ins *i;
    uint nGoTos = 0, j;

    s->rule = NULL;
    for(iP = s->kernel; (i = *iP) != NULL; ++iP){
        if(i->i.tag == CHAR){
        for(Ins *j = i + 1; j < (Ins*) i->i.link; ++j){
            if((j->c.link = goTo[j->c.value - lb].to) == 0)
            goTo[nGoTos++].ch = (Char)j->c.value;
            goTo[j->c.value - lb].to = j;
        }
        } else if(i->i.tag == TERM){
        if(!s->rule || ((RuleOp*) i->i.link)->accept < s->rule->accept)
            s->rule = (RuleOp*) i->i.link;
        }
    }

    for(j = 0; j < nGoTos; ++j){
        GoTo *go = &goTo[goTo[j].ch - lb];
        i = (Ins*) go->to;
        for(cP = work; i; i = (Ins*) i->c.link)
        cP = closure(cP, i + i->c.bump);
        go->to = findState(work, cP - work);
    }

    s->go.nSpans = 0;
    for(j = 0; j < nc;){
        State *to = (State*) goTo[rep[j]].to;
        while(++j < nc && goTo[rep[j]].to == to);
        span[s->go.nSpans].ub = lb + j;
        span[s->go.nSpans].to = to;
        s->go.nSpans++;
    }

    for(j = nGoTos; j-- > 0;)
        goTo[goTo[j].ch - lb].to = NULL;

    s->go.span = new Span[s->go.nSpans];
    memcpy((char*) s->go.span, (char*) span, s->go.nSpans*sizeof(Span));

    (void) new Match(s);

    }
    delete [] work;
    delete [] goTo;
    delete [] span;
}

DFA::~DFA(){
    State *s;
    while((s = head) != NULL){
    head = s->next;
    delete s;
    }
}

void DFA::addState(State **a, State *s){
    s->label = nStates++;
    s->next = *a;
    *a = s;
    if(a == tail)
    tail = &s->next;
}

State *DFA::findState(Ins **kernel, uint kCount){
    Ins **cP, **iP;
    Ins *i;
    State *s;

    kernel[kCount] = NULL;

    cP = kernel;
    for(iP = kernel; (i = *iP) != NULL; ++iP){
     if(i->i.tag == CHAR || i->i.tag == TERM){
         *cP++ = i;
    } else {
         unmark(i);
    }
    }
    kCount = cP - kernel;
    kernel[kCount] = NULL;

    for(s = head; s; s = s->next){
     if(s->kCount == kCount){
         for(iP = s->kernel; (i = *iP) != 0; ++iP)
         if(!isMarked(i))
             goto nextState;
         goto unmarkAll;
     }
     nextState:;
    }

    s = new State;
    addState(tail, s);
    s->kCount = kCount;
    s->kernel = new Ins*[kCount+1];
    memcpy(s->kernel, kernel, (kCount+1)*sizeof(Ins*));
    s->link = toDo;
    toDo = s;

unmarkAll:
    for(iP = kernel; (i = *iP) != NULL; ++iP)
     unmark(i);

    return s;
}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?