⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 decipherngram.cc

📁 这是一款很好用的工具包
💻 CC
字号:
/*
 * DecipherNgram.cc --
 *	Approximate N-gram backoff language model used in Decipher recognizer
 *
 */

#ifndef lint
static char Copyright[] = "Copyright (c) 1995, SRI International.  All Rights Reserved.";
static char RcsId[] = "@(#)$Header: /home/srilm/devel/lm/src/RCS/DecipherNgram.cc,v 1.9 2006/01/05 20:21:27 stolcke Exp $";
#endif

#include <iostream>
using namespace std;
#include <stdlib.h>

#include "DecipherNgram.h"

#define DEBUG_NGRAM_HITS 2	/* from Ngram.cc */

DecipherNgram::DecipherNgram(Vocab &vocab, unsigned order, Boolean backoffHack)
      : Ngram(vocab, order), backoffHack(backoffHack)
{
}

/*
 * Simulate the rounding going on from the original LM LogP scores to the
 * bytelogs in the recognizer:
 * - PFSGs encode LogP as intlogs
 * - Nodearray compiler maps intlogs to bytelogs
 */
#define RoundToBytelog(x)	BytelogToLogP(IntlogToBytelog(LogPtoIntlog(x)))

/*
 * The backoff algorithm is similar to Ngram:wordProbBO(),
 * with the following modifications:
 * - bows and probs are truncated to ByteLog precision
 * - the backed-off probability is returned if it is larger than the
 *   direct ngram probability.
 */
LogP
DecipherNgram::wordProbBO(VocabIndex word, const VocabIndex *context, unsigned int clen)
{
    LogP result;
    /*
     * To use the context array for lookup we truncate it to the
     * indicated length, restoring the mangled item on exit.
     */
    VocabIndex saved = context[clen];
    ((VocabIndex *)context)[clen] = Vocab_None;	/* discard const */

    LogP *prob = findProb(word, context);
    LogP boProb = LogP_Zero;

    /*
     * Compute the backed-off probability always
     */
    if (clen > 0) {
	LogP *bow = findBOW(context);

	if (bow) {
	   boProb = RoundToBytelog(*bow) + wordProbBO(word, context, clen - 1);
	} else {
	   boProb = wordProbBO(word, context, clen - 1);
	}
    }
    
    if (prob) {
	result = RoundToBytelog(*prob);

	if (running() && debug(DEBUG_NGRAM_HITS)) {
	    dout() << "[" << (clen + 1) << "gram]";
	}

	if (backoffHack && boProb > result) {
	    result = boProb;

	    if (running() && debug(DEBUG_NGRAM_HITS)) {
		dout() << "[bo]";
	    }
	}
    } else {
	result = boProb;
    }
    ((VocabIndex *)context)[clen] = saved;	/* discard const */
    return result;
}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -