gneuralnet.cpp
来自「Mike Gashler 的机器学习库 — GNeuralNet 神经网络模块」· C++ 代码 · 共 996 行 · 第 1/2 页
CPP
996 行
for(i = 0; i < nValueCount; i++) pInternal[nInternalIndex + i] = OUTPUT_MIN; if(pExternal[nExternalIndex] != -1) // -1 = unknown value { GAssert((int)pExternal[nExternalIndex] >= 0 && (int)pExternal[nExternalIndex] < nValueCount, "out of range"); pInternal[nInternalIndex + (int)pExternal[nExternalIndex]] = OUTPUT_MIN + OUTPUT_RANGE; } nInternalIndex += nValueCount; } } } GAssert(nInternalIndex == m_pInternalRelation->GetAttributeCount(), "error");}void GNeuralNet::OutputsToExternal(double* pInternal, double* pExternal){ GAssert(m_pMinAndRanges, "min and ranges not calculated yet"); GArffAttribute* pAttr; int nValueCount; int nOutputCount = m_pRelation->GetOutputCount(); int nInternalIndex = m_pInternalRelation->GetOutputIndex(0); int n, nExternalIndex; for(n = 0; n < nOutputCount; n++) { nExternalIndex = m_pRelation->GetOutputIndex(n); pAttr = m_pRelation->GetAttribute(nExternalIndex); if(pAttr->IsContinuous()) pExternal[nExternalIndex] = GArffData::Normalize(pInternal[nInternalIndex++], OUTPUT_MIN, OUTPUT_RANGE, m_pMinAndRanges[nExternalIndex + nExternalIndex], m_pMinAndRanges[nExternalIndex + nExternalIndex + 1]); else { nValueCount = pAttr->GetValueCount(); if(nValueCount <= 2) pExternal[nExternalIndex] = (pInternal[nInternalIndex++] >= OUTPUT_MIDDLE ? 
1 : 0); else { pExternal[nExternalIndex] = GVector::FindMax(&pInternal[nInternalIndex], nValueCount); nInternalIndex += nValueCount; } } } GAssert(nInternalIndex == m_pInternalRelation->GetAttributeCount(), "error");}void GNeuralNet::AddLayer(int nNodes){ GAssert(m_nInputStart == 0, "already made the input layer"); int nPrevLayerStart = m_nLayerStart; int nPrevLayerSize = m_nLayerSize; m_nLayerStart = m_pNeurons->GetSize(); m_nLayerSize = nNodes; int n, i; for(n = 0; n < nNodes; n++) { GStandardNeuron* pNewNeuron = new GStandardNeuron(); m_pNeurons->AddPointer(pNewNeuron); for(i = 0; i < nPrevLayerSize; i++) { GNeuron* pOldNeuron = (GNeuron*)m_pNeurons->GetPointer(nPrevLayerStart + i); pOldNeuron->AddInput(pNewNeuron); } }}int GNeuralNet::GetWeightCount(){ if(m_nWeightCount == 0) { int n; int nCount = m_pNeurons->GetSize(); GNeuron* pNeuron; for(n = 0; n < nCount; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); m_nWeightCount += pNeuron->SerializeWeights(NULL); } } return m_nWeightCount;}void GNeuralNet::GetWeights(double* pOutWeights){ // Serialize the weights int nCount = m_pNeurons->GetSize(); int nPos = 0; int n; GNeuron* pNeuron; for(n = 0; n < nCount; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); nPos += pNeuron->SerializeWeights(&pOutWeights[nPos]); } GAssert(nPos == m_nWeightCount, "serialization size inconsistent");}void GNeuralNet::SetWeights(double* pWeights){ int n; int nCount = m_pNeurons->GetSize(); GNeuron* pNeuron; int nPos = 0; for(n = 0; n < nCount; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); nPos += pNeuron->DeserializeWeights(&pWeights[nPos]); } GAssert(nPos == m_nWeightCount, "serialization size inconsistent");}void GNeuralNet::UpdateBestWeights(){ if(!m_pBestSet) m_pBestSet = new double[GetWeightCount()]; GetWeights(m_pBestSet);}void GNeuralNet::RestoreBestWeights(){ SetWeights(m_pBestSet);}void GNeuralNet::EvalInternal(double* pRow){ // Clear the outputs of all non-input neurons GNeuron* pNeuron; int n; for(n = 0; n < 
m_nInputStart; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pNeuron->SetOutput(1e50); } // Copy inputs into input neurons int nInputs = m_pInternalRelation->GetInputCount(); int nCount = m_nInputStart + nInputs; GAssert(nCount == m_pNeurons->GetSize(), "neurons added after input neurons?"); int nInput = 0; for( ; n < nCount; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pNeuron->SetOutput(pRow[nInput++]); } // Pull the evaluation downstream to the output nodes int nOutputs = m_pInternalRelation->GetOutputCount(); for(n = 0; n < nOutputs; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pNeuron->PullEvalDownStream(); }}void GNeuralNet::Eval(double* pRow){ // Convert to internal data double* pInternalRow = (double*)alloca(sizeof(double) * m_pInternalRelation->GetAttributeCount()); InputsToInternal(pRow, pInternalRow); // Do the evaluation EvalInternal(pInternalRow); // Extract the output values from the output nodes GNeuron* pNeuron; int n; int nOutputs = m_pInternalRelation->GetOutputCount(); int nIndex = m_pInternalRelation->GetOutputIndex(0); for(n = 0; n < nOutputs; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pInternalRow[nIndex++] = pNeuron->GetOutput(); } // Convert outputs to external data OutputsToExternal(pInternalRow, pRow);}double GNeuralNet::Criticize(double* pModel){ // Calculate the error on all output nodes GNeuron* pNeuron = NULL; int n; double dOutput; double dSumSquaredError = 0; double dDelta; int nOutputs = m_pInternalRelation->GetOutputCount(); int nIndex = m_pInternalRelation->GetOutputIndex(0); for(n = 0; n < nOutputs; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); dOutput = pNeuron->GetOutput(); dDelta = pModel[nIndex++] - dOutput; dSumSquaredError += (dDelta * dDelta); pNeuron->SetError(dDelta * dOutput * (1.0 - dOutput)); } // Clear the error on the rest of the nodes for( ; n < m_nInputStart; n++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pNeuron->SetError(1e50); } // Backpropagate the error to 
all but the input layers for(n = m_nLayerStart; n < m_nInputStart; n++) // m_nLayerStart now points to the last non-input layer { pNeuron = (GNeuron*)m_pNeurons->GetPointer(n); pNeuron->PullErrorBackUpStream(); } return dSumSquaredError;}void GNeuralNet::MeasureMinAndRanges(GArffData* pTrainingData){ delete(m_pMinAndRanges); int nAttrCount = m_pRelation->GetAttributeCount(); m_pMinAndRanges = new double[2 * nAttrCount]; GArffAttribute* pAttr; int n; for(n = 0; n < nAttrCount; n++) { pAttr = m_pRelation->GetAttribute(n); if(pAttr->IsContinuous()) { pTrainingData->GetMinAndRange(n, &m_pMinAndRanges[2 * n], &m_pMinAndRanges[2 * n + 1]); if(m_pMinAndRanges[2 * n + 1] < .00001) m_pMinAndRanges[2 * n + 1] = .00001; } else { m_pMinAndRanges[2 * n] = 0; m_pMinAndRanges[2 * n + 1] = 0; } }}void GNeuralNet::ExternalToInternalData(GArffData* pExternal, GArffData* pInternal){ double* pExternalRow; double* pInternalRow; int n; int nInternalAttributeCount = m_pInternalRelation->GetAttributeCount(); int nRowCount = pExternal->GetSize(); for(n = 0; n < nRowCount; n++) { pExternalRow = pExternal->GetVector(n); pInternalRow = new double[nInternalAttributeCount]; InputsToInternal(pExternalRow, pInternalRow); OutputsToInternal(pExternalRow, pInternalRow); pInternal->AddVector(pInternalRow); }}double GNeuralNet::TrainValidate(){ int n, i, nIndex; GNeuron* pNeuron; double* pRow; double d; double dError = 0; int nCount = m_pValidationDataInternal->GetSize(); int nOutputs = m_pInternalRelation->GetOutputCount(); for(n = 0; n < nCount; n++) { pRow = m_pValidationDataInternal->GetVector(n); EvalInternal(pRow); nIndex = m_pInternalRelation->GetOutputIndex(0); for(i = 0; i < nOutputs; i++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(i); d = pRow[nIndex++] - pNeuron->GetOutput(); d *= d; dError += d; } } dError /= (nCount * nOutputs); return dError;}void GNeuralNet::PrintNeurons(){ printf("-----------------\n"); GNeuron* pNeuron; int n; for(n = 0; n < m_nInputStart; n++) { pNeuron = 
(GNeuron*)m_pNeurons->GetPointer(n); printf("Neuron %d\n", n); pNeuron->Print(); } printf("-----------------\n");}void GNeuralNet::Train(GArffData* pData){ int nTrainRows = (int)(m_dTrainingPortion * pData->GetSize()); GArffData* pValidateData = pData->SplitBySize(nTrainRows); Train(pData, pValidateData);}int GNeuralNet::Train(GArffData* pTrainingData, GArffData* pValidationData){ TrainInit(pTrainingData, pValidationData); // Do the epochs int nEpochs; double dBestError = 1e20; int nEpochsSinceValidationCheck = 0; int nBestEpoch = 0; for(nEpochs = 0; true; nEpochs++) { TrainEpoch(); // Check for termination condition nEpochsSinceValidationCheck++; if(nEpochsSinceValidationCheck >= m_nEpochsPerValidationCheck) { nEpochsSinceValidationCheck = 0; double dMeanSquareError = TrainValidate();//printf("Epoch: %d\tError=%lf\n", nEpochs, dBestError); if(dMeanSquareError < dBestError) { // Found a new best set of weights dBestError = dMeanSquareError; nBestEpoch = nEpochs; UpdateBestWeights(); if(dMeanSquareError <= m_dAcceptableMeanSquareError) break; } else { // Test for termination condition if(nEpochs - nBestEpoch >= m_nRunEpochs) break; } if(nEpochs >= m_nMaximumEpochs) break; } } if(dBestError < 1e20) RestoreBestWeights(); else { GAssert(false, "Total failure!"); } ReleaseInternalData(); return nEpochs;}void GNeuralNet::TrainInit(GArffData* pTrainingData, GArffData* pValidationData){ GAssert(m_nRunEpochs <= m_nMaximumEpochs, "conflicting settings"); // Add the input layer MakeInputLayer(); // Make the internal data MeasureMinAndRanges(pTrainingData); ReleaseInternalData(); m_pTrainingDataInternal = new GArffData(pTrainingData->GetSize()); ExternalToInternalData(pTrainingData, m_pTrainingDataInternal); if(pTrainingData == pValidationData) m_pValidationDataInternal = m_pTrainingDataInternal; else { m_pValidationDataInternal = new GArffData(pValidationData->GetSize()); ExternalToInternalData(pValidationData, m_pValidationDataInternal); }}void 
GNeuralNet::IncrementalInit(int nBatchSize, double dMin, double dRange){ // Add the input layer MakeInputLayer(); // Set the mins and ranges delete(m_pMinAndRanges); int nAttrCount = m_pRelation->GetAttributeCount(); m_pMinAndRanges = new double[2 * nAttrCount]; int n; for(n = 0; n < nAttrCount; n++) { m_pMinAndRanges[2 * n] = dMin; m_pMinAndRanges[2 * n + 1] = dRange; } // Make the batch data ReleaseInternalData(); m_pTrainingDataInternal = new GArffData(nBatchSize);}void GNeuralNet::TrainEpoch(){ // Shuffle the data set m_pTrainingDataInternal->Shuffle(); // Do a single epoch m_dSumSquaredError = 0; double* pRow; GNeuron* pNeuron; int n, i; int nRowCount = m_pTrainingDataInternal->GetSize(); for(n = 0; n < nRowCount; n++) { // Compute output for this row and update the weights pRow = m_pTrainingDataInternal->GetVector(n); EvalInternal(pRow); // Backpropagate the error m_dSumSquaredError += Criticize(pRow); // Adjust the weights in a gradient descent manner for(i = 0; i < m_nInputStart; i++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(i); pNeuron->AdjustWeights(m_dLearningRate, m_dMomentum); } } m_dLearningRate *= m_dLearningDecay; m_nEpochs++;}int GNeuralNet::TrainBatch(GArffData* pTrainingData, GArffData* pValidationData){ TrainInit(pTrainingData, pValidationData); // Do the epochs double* pRow; GNeuron* pNeuron; int n, i, nEpochs; double dBestError = 1e20; int nRowCount = m_pTrainingDataInternal->GetSize(); int nEpochsSinceValidationCheck = 0; int nBestEpoch = 0; for(nEpochs = 0; true; nEpochs++) { // Train with each of the training examples (one epoch) for(n = 0; n < nRowCount; n++) { // Compute output for this row and update the weights pRow = m_pTrainingDataInternal->GetVector(n); EvalInternal(pRow); // Backpropagate the error Criticize(pRow); // Adjust the weight delta in a gradient descent manner for(i = 0; i < m_nInputStart; i++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(i); pNeuron->BatchUpdateDeltas(m_dLearningRate); } } // Adjust the weights by the 
sum weight delta for(i = 0; i < m_nInputStart; i++) { pNeuron = (GNeuron*)m_pNeurons->GetPointer(i); pNeuron->BatchUpdateWeights(); } m_dLearningRate *= m_dLearningDecay; // Check for termination condition nEpochsSinceValidationCheck++; if(nEpochsSinceValidationCheck >= m_nEpochsPerValidationCheck) { nEpochsSinceValidationCheck = 0; double dMeanSquareError = TrainValidate();//printf("Epoch: %d\tError=%lf\n", nEpochs, dBestError); if(dMeanSquareError < dBestError) { // Found a new best set of weights dBestError = dMeanSquareError; nBestEpoch = nEpochs; UpdateBestWeights(); if(dMeanSquareError <= m_dAcceptableMeanSquareError) break; } else { // Test for termination condition if(nEpochs - nBestEpoch >= m_nRunEpochs) break; } if(nEpochs >= m_nMaximumEpochs) break; } } if(dBestError < 1e20) RestoreBestWeights(); else { GAssert(false, "Total failure!"); } ReleaseInternalData(); return nEpochs;}
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?