Cpp ML Library  1.0.0
A library of Machine Learning algorithms from the Udemy course Machine Learning A to Z.
NeuralNetwork.hpp
#ifndef NEURAL_NETWORK_HPP
#define NEURAL_NETWORK_HPP

#include <vector>
#include <cmath>
#include <cstdlib>
#include <cassert>
#include <iostream>

/// Represents a connection between neurons with a weight and a change in weight.
struct Connection {
    double weight;      ///< The weight of the connection.
    double deltaWeight; ///< The change in weight (used for momentum).
};

/// Represents a single neuron in the neural network.
class Neuron {
public:
    /// Constructs a Neuron with one connection per neuron in the next layer.
    Neuron(unsigned numOutputs, unsigned index);

    /// Sets the output value of the neuron.
    void setOutputVal(double val);

    /// Gets the output value of the neuron.
    double getOutputVal() const;

    /// Feeds the outputs of the previous layer forward into this neuron.
    void feedForward(const std::vector<Neuron>& prevLayer);

    /// Calculates the gradient for an output-layer neuron.
    void calcOutputGradients(double targetVal);

    /// Calculates the gradient for a hidden-layer neuron.
    void calcHiddenGradients(const std::vector<Neuron>& nextLayer);

    /// Updates the weights of the connections feeding this neuron.
    void updateInputWeights(std::vector<Neuron>& prevLayer);

private:
    /// Returns a random weight in [0, 1].
    static double randomWeight();

    /// The activation function (tanh).
    static double activationFunction(double x);

    /// Derivative of the activation function, in terms of the neuron's output.
    static double activationFunctionDerivative(double x);

    /// Sums this neuron's contributions to the errors of the next layer.
    double sumDOW(const std::vector<Neuron>& nextLayer) const;

    double m_outputVal;
    std::vector<Connection> m_outputWeights;
    unsigned m_myIndex;
    double m_gradient;

    // Hyperparameters
    static double eta;   ///< Learning rate
    static double alpha; ///< Momentum
};

// Initialize static members
double Neuron::eta = 0.15;  // Learning rate
double Neuron::alpha = 0.5; // Momentum

Neuron::Neuron(unsigned numOutputs, unsigned index)
    : m_outputVal(0.0), m_myIndex(index), m_gradient(0.0)
{
    for (unsigned c = 0; c < numOutputs; ++c) {
        Connection conn;
        conn.weight = randomWeight();
        conn.deltaWeight = 0.0;
        m_outputWeights.push_back(conn);
    }
}

void Neuron::setOutputVal(double val) {
    m_outputVal = val;
}

double Neuron::getOutputVal() const {
    return m_outputVal;
}

void Neuron::feedForward(const std::vector<Neuron>& prevLayer) {
    double sum = 0.0;

    // Sum the previous layer's outputs (which are our inputs),
    // including the bias node from the previous layer.
    for (size_t n = 0; n < prevLayer.size(); ++n) {
        sum += prevLayer[n].getOutputVal() * prevLayer[n].m_outputWeights[m_myIndex].weight;
    }

    m_outputVal = Neuron::activationFunction(sum);
}

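// In symbols, with y_i the outputs of the previous layer (bias included) and
// w_{i,j} the weight of the connection from neuron i to this neuron j,
// feedForward computes:
//
//   y_j = tanh( sum_i  y_i * w_{i,j} )
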
void Neuron::calcOutputGradients(double targetVal) {
    double delta = targetVal - m_outputVal;
    m_gradient = delta * Neuron::activationFunctionDerivative(m_outputVal);
}

void Neuron::calcHiddenGradients(const std::vector<Neuron>& nextLayer) {
    double dow = sumDOW(nextLayer);
    m_gradient = dow * Neuron::activationFunctionDerivative(m_outputVal);
}

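// Gradient formulas implemented above, for a neuron with output y:
//
//   output layer:  gradient = (target - y) * f'(y)
//   hidden layer:  gradient = ( sum_k w_k * gradient_k ) * f'(y)
//
// where f'(y) = 1 - y^2 is the tanh derivative expressed in terms of the
// output, and the sum runs over the next layer's non-bias neurons (sumDOW).
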
void Neuron::updateInputWeights(std::vector<Neuron>& prevLayer) {
    // Update the weights stored in the previous layer's neurons
    for (size_t n = 0; n < prevLayer.size(); ++n) {
        Neuron& neuron = prevLayer[n];
        double oldDeltaWeight = neuron.m_outputWeights[m_myIndex].deltaWeight;

        double newDeltaWeight =
            // Individual input, magnified by the gradient and learning rate:
            eta * neuron.getOutputVal() * m_gradient
            // Plus momentum: a fraction of the previous delta weight
            + alpha * oldDeltaWeight;

        neuron.m_outputWeights[m_myIndex].deltaWeight = newDeltaWeight;
        neuron.m_outputWeights[m_myIndex].weight += newDeltaWeight;
    }
}

double Neuron::randomWeight() {
    // Random weight in [0, 1]; note that rand() is not seeded here.
    return rand() / double(RAND_MAX);
}

double Neuron::activationFunction(double x) {
    // Hyperbolic tangent activation function, output range (-1, 1)
    return tanh(x);
}

double Neuron::activationFunctionDerivative(double x) {
    // Derivative of tanh, where x is the neuron's *output* y = tanh(sum):
    // d/dsum tanh(sum) = 1 - tanh^2(sum) = 1 - y^2
    return 1.0 - x * x;
}

double Neuron::sumDOW(const std::vector<Neuron>& nextLayer) const {
    double sum = 0.0;

    // Sum our contributions to the errors at the nodes we feed
    // (excluding the next layer's bias neuron)
    for (size_t n = 0; n < nextLayer.size() - 1; ++n) {
        sum += m_outputWeights[n].weight * nextLayer[n].m_gradient;
    }

    return sum;
}

/// Represents the neural network consisting of layers of neurons.
class NeuralNetwork {
public:
    /// Constructs a NeuralNetwork with the given topology
    /// (number of neurons per layer, from input to output).
    NeuralNetwork(const std::vector<unsigned>& topology);

    /// Feeds the input values forward through the network.
    void feedForward(const std::vector<double>& inputVals);

    /// Performs backpropagation to adjust the weights.
    void backProp(const std::vector<double>& targetVals);

    /// Gets the results from the output layer.
    void getResults(std::vector<double>& resultVals) const;

    /// Gets the recent average error of the network.
    double getRecentAverageError() const;

private:
    std::vector<std::vector<Neuron>> m_layers;
    double m_error;
    double m_recentAverageError;
    static double m_recentAverageSmoothingFactor;
};

// Initialize static members
double NeuralNetwork::m_recentAverageSmoothingFactor = 100.0;

NeuralNetwork::NeuralNetwork(const std::vector<unsigned>& topology)
    : m_error(0.0), m_recentAverageError(0.0)
{
    size_t numLayers = topology.size();
    for (size_t layerNum = 0; layerNum < numLayers; ++layerNum) {
        m_layers.push_back(std::vector<Neuron>());
        unsigned numOutputs = (layerNum == topology.size() - 1) ? 0 : topology[layerNum + 1];

        // Add neurons to the layer, plus one extra bias neuron
        for (unsigned neuronNum = 0; neuronNum <= topology[layerNum]; ++neuronNum) {
            m_layers.back().push_back(Neuron(numOutputs, neuronNum));
        }

        // Force the bias node's output value to 1.0
        m_layers.back().back().setOutputVal(1.0);
    }
}

void NeuralNetwork::feedForward(const std::vector<double>& inputVals) {
    assert(inputVals.size() == m_layers[0].size() - 1);

    // Assign the input values to the input neurons
    for (size_t i = 0; i < inputVals.size(); ++i) {
        m_layers[0][i].setOutputVal(inputVals[i]);
    }

    // Forward propagation, layer by layer (skipping each layer's bias neuron)
    for (size_t layerNum = 1; layerNum < m_layers.size(); ++layerNum) {
        std::vector<Neuron>& prevLayer = m_layers[layerNum - 1];
        for (size_t n = 0; n < m_layers[layerNum].size() - 1; ++n) {
            m_layers[layerNum][n].feedForward(prevLayer);
        }
    }
}

void NeuralNetwork::backProp(const std::vector<double>& targetVals) {
    // Calculate overall net error (RMS of output neuron errors)
    std::vector<Neuron>& outputLayer = m_layers.back();
    m_error = 0.0;

    for (size_t n = 0; n < outputLayer.size() - 1; ++n) {
        double delta = targetVals[n] - outputLayer[n].getOutputVal();
        m_error += delta * delta;
    }
    m_error /= outputLayer.size() - 1; // Average squared error
    m_error = sqrt(m_error);           // RMS

    // Keep a recent average error measurement
    m_recentAverageError =
        (m_recentAverageError * m_recentAverageSmoothingFactor + m_error)
        / (m_recentAverageSmoothingFactor + 1.0);

    // Calculate output layer gradients
    for (size_t n = 0; n < outputLayer.size() - 1; ++n) {
        outputLayer[n].calcOutputGradients(targetVals[n]);
    }

    // Calculate gradients on hidden layers, from the last hidden layer backwards
    for (size_t layerNum = m_layers.size() - 2; layerNum > 0; --layerNum) {
        std::vector<Neuron>& hiddenLayer = m_layers[layerNum];
        std::vector<Neuron>& nextLayer = m_layers[layerNum + 1];

        for (size_t n = 0; n < hiddenLayer.size(); ++n) {
            hiddenLayer[n].calcHiddenGradients(nextLayer);
        }
    }

    // Update connection weights for all layers, from the output layer
    // back to the first hidden layer
    for (size_t layerNum = m_layers.size() - 1; layerNum > 0; --layerNum) {
        std::vector<Neuron>& layer = m_layers[layerNum];
        std::vector<Neuron>& prevLayer = m_layers[layerNum - 1];

        for (size_t n = 0; n < layer.size() - 1; ++n) {
            layer[n].updateInputWeights(prevLayer);
        }
    }
}

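// The "recent average error" above is a running average with smoothing
// factor N = m_recentAverageSmoothingFactor:
//
//   recentAvg <- (recentAvg * N + error) / (N + 1)
//
// so each backProp call nudges the average toward the latest RMS error.
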
void NeuralNetwork::getResults(std::vector<double>& resultVals) const {
    resultVals.clear();
    const std::vector<Neuron>& outputLayer = m_layers.back();
    for (size_t n = 0; n < outputLayer.size() - 1; ++n) {
        resultVals.push_back(outputLayer[n].getOutputVal());
    }
}

double NeuralNetwork::getRecentAverageError() const {
    return m_recentAverageError;
}

#endif // NEURAL_NETWORK_HPP
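
As a quick illustration of the API above, here is a minimal usage sketch that trains the network on XOR. The topology {2, 4, 1} and the epoch count are illustrative choices, not part of the library:

// Hypothetical usage example (not part of NeuralNetwork.hpp)
#include "NeuralNetwork.hpp"
#include <iostream>
#include <vector>

int main() {
    // 2 inputs, one hidden layer of 4 neurons, 1 output
    NeuralNetwork net(std::vector<unsigned>{2, 4, 1});

    // Train on the four XOR patterns for a fixed number of epochs
    for (int epoch = 0; epoch < 2000; ++epoch) {
        for (int a = 0; a <= 1; ++a) {
            for (int b = 0; b <= 1; ++b) {
                net.feedForward({double(a), double(b)});
                net.backProp({double(a ^ b)});
            }
        }
    }

    // Query the trained network
    std::vector<double> results;
    net.feedForward({1.0, 0.0});
    net.getResults(results);
    std::cout << "1 XOR 0 ~ " << results[0] << "\n";
    std::cout << "recent average error: " << net.getRecentAverageError() << "\n";
    return 0;
}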