UESMANN CPP 1.0
Reference implementation of UESMANN
bpnet.hpp
#ifndef __BPNET_HPP
#define __BPNET_HPP

#include "net.hpp"

/**
 * The "basic" back-propagation network using a logistic sigmoid, as
 * described by Rumelhart, Hinton and Williams (and many others). This
 * class is used by output blending and h-as-input networks.
 */
class BPNet : public Net {
protected:
    /**
     * Special constructor for subclasses which need to manipulate the
     * layer count before initialisation; such subclasses must then call
     * init() themselves.
     */
    BPNet() : Net(NetType::PLAIN) {
        // NB: the initialiser and body here are reconstructed from the
        // surrounding code; NetType::PLAIN is an assumption, matching the
        // main constructor below.
    }

    /**
     * Initialiser for use by the main constructor and by the ctors of
     * those subclasses mentioned in BPNet().
     */
    void init(int nlayers,const int *layerCounts){
        numLayers = nlayers;
        outputs = new double* [numLayers];
        errors = new double* [numLayers];
        layerSizes = new int [numLayers];
        largestLayerSize = 0; // assumed initialisation; required by the max-scan below
        for(int i=0;i<numLayers;i++){
            int n = layerCounts[i];
            outputs[i] = new double[n];
            errors[i] = new double[n];
            for(int k=0;k<n;k++)
                outputs[i][k]=0;
            layerSizes[i]=n;
            if(n>largestLayerSize)
                largestLayerSize=n;
        }

        weights = new double * [numLayers];
        gradAvgsWeights = new double* [numLayers];
        biases = new double* [numLayers];
        gradAvgsBiases = new double* [numLayers];
        for(int i=0;i<numLayers;i++){
            int n = layerCounts[i];
            // every layer gets a full largestLayerSize^2 weight block;
            // see getw() for the indexing scheme
            weights[i] = new double[largestLayerSize*largestLayerSize];
            gradAvgsWeights[i] = new double[largestLayerSize*largestLayerSize];
            biases[i] = new double[n];
            gradAvgsBiases[i] = new double[n];
        }
    }

public:
    /**
     * Constructor. This does not initialise the weights to random values,
     * so that networks can be reinitialised (see initWeights()).
     */
    BPNet(int nlayers,const int *layerCounts) : Net(NetType::PLAIN) {
        init(nlayers,layerCounts);
    }

    /**
     * Set the modulator level for subsequent runs and training of this
     * network. Does nothing here, because this is an unmodulated net.
     */
    virtual void setH(double h){
    }

    /**
     * Get the modulator level.
     */
    virtual double getH() const {
        return 0;
    }

    /**
     * Destructor.
     */
    virtual ~BPNet(){
        for(int i=0;i<numLayers;i++){
            delete [] weights[i];
            delete [] biases[i];
            delete [] gradAvgsWeights[i];
            delete [] gradAvgsBiases[i];
            delete [] outputs[i];
            delete [] errors[i];
        }
        delete [] weights;
        delete [] biases;
        delete [] gradAvgsWeights;
        delete [] gradAvgsBiases;
        delete [] outputs;
        delete [] errors;
        delete [] layerSizes;
    }

    /**
     * Set the inputs to the network before running or training.
     */
    virtual void setInputs(double *d) {
        for(int i=0;i<layerSizes[0];i++){
            outputs[0][i]=d[i];
        }
    }

    /**
     * Used to set inputs manually, typically in HInputNet.
     */
    void setInput(int n, double d){
        outputs[0][n] = d;
    }

    /**
     * Get the outputs after running.
     */
    virtual double *getOutputs() const {
        return outputs[numLayers-1];
    }

    /**
     * Get the number of nodes in a given layer.
     */
    virtual int getLayerSize(int n) const {
        return layerSizes[n];
    }

    /**
     * Get the number of layers.
     */
    virtual int getLayerCount() const {
        return numLayers;
    }

    /**
     * Get the length of the serialised data block for this network.
     */
    virtual int getDataSize() const {
        // Each layer contributes one bias per node, plus one weight for
        // each (node, previous-layer node) pair: c*(1+pc) values in all.
        //
        // NOTE that this uses the true layer size rather than the fake
        // version returned in the subclass HInputNet.
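        // For example, layers {2,3,1} give 2*(1+0) + 3*(1+2) + 1*(1+3) = 15
        // doubles (input-layer biases are stored even though they are unused).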
        int pc=0;
        int total=0;
        for(int i=0;i<numLayers;i++){
            int c = layerSizes[i];
            total += c*(1+pc);
            pc = c;
        }
        return total;
    }

    /**
     * Serialise the data (not including any network type magic number or
     * layer/node counts) to the given memory block, which must be of the
     * size given by getDataSize().
     */
    virtual void save(double *buf) const {
        double *g=buf;
        // Data is ordered by layer, then by node within the layer; each
        // node stores its bias followed by its input weights.
        //
        // NOTE that this uses the true layer size rather than the fake
        // version returned in the subclass HInputNet.
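        // For layers {2,3,1} the order is:
        //   b[0][0], b[0][1],                           (input layer: biases only)
        //   b[1][0], w(1,0,0), w(1,0,1), ... , b[1][2], w(1,2,0), w(1,2,1),
        //   b[2][0], w(2,0,0), w(2,0,1), w(2,0,2)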
        for(int i=0;i<numLayers;i++){
            for(int j=0;j<layerSizes[i];j++){
                *g++ = biases[i][j];
                if(i){
                    for(int k=0;k<layerSizes[i-1];k++){
                        *g++ = getw(i,j,k);
                    }
                }
            }
        }
    }

    /**
     * Load the parameters from a data block of the correct size for the
     * current network (as written by save()).
     */
    virtual void load(double *buf){
        double *g=buf;
        // The genome is ordered by layer, then by node within the layer;
        // each node stores its bias followed by its input weights.
        //
        // NOTE that this uses the true layer size rather than the fake
        // version returned in the subclass HInputNet.
        for(int i=0;i<numLayers;i++){
            for(int j=0;j<layerSizes[i];j++){
                biases[i][j]=*g++;
                if(i){
                    for(int k=0;k<layerSizes[i-1];k++){
                        getw(i,j,k) = *g++;
                    }
                }
            }
        }
    }

protected:
    int numLayers;        //!< number of layers, including input and output
    int *layerSizes;      //!< array of layer sizes
    int largestLayerSize; //!< number of nodes in the largest layer

    /**
     * Array of weights, stored as [tolayer][tonode+largestLayerSize*fromnode];
     * each layer owns a rectangular largestLayerSize^2 block, of which only
     * part may be used.
     */
    double **weights;

    /** Array of biases, stored as a rectangular array of [layer][node]. */
    double **biases;

    // data generated during training and running

    double **outputs; //!< outputs of each layer: one array of doubles for each
    double **errors;  //!< the error for each node, calculated by calcError()

    double **gradAvgsWeights; //!< average gradient for each weight (built during training)
    double **gradAvgsBiases;  //!< average gradient for each bias (built during training)

    /**
     * Initialise weights to random values.
     */
    virtual void initWeights(double initr){
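        // If initr<=0, each layer's range is 1/sqrt(n), where n is the size
        // of the previous layer (the fan-in heuristic from Bishop); otherwise
        // the fixed range [-initr,initr] is used everywhere.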
        for(int i=0;i<numLayers;i++){
            double initrange;
            if(i){
                double ct = layerSizes[i-1];
                if(initr>0)
                    initrange = initr;
                else
                    initrange = 1.0/sqrt(ct); // from Bishop
            } else
                initrange = 0.1; // on the input layer this should mean little
            for(int j=0;j<layerSizes[i];j++)
                biases[i][j]=drand(-initrange,initrange);
            for(int j=0;j<largestLayerSize*largestLayerSize;j++){
                weights[i][j]=drand(-initrange,initrange);
            }
        }
        // zero the input layer weights and biases, which should be unused
        for(int j=0;j<layerSizes[0];j++)
            biases[0][j]=0;
        for(int j=0;j<largestLayerSize*largestLayerSize;j++)
            weights[0][j]=0;
    }

    /**
     * Get a reference to a weight: the weight into neuron `toneuron' in
     * layer `tolayer' from neuron `fromneuron' in the previous layer.
     */
    inline double& getw(int tolayer,int toneuron,int fromneuron) const {
        return weights[tolayer][toneuron+largestLayerSize*fromneuron];
    }
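    // Example: with largestLayerSize=4, the weight into neuron 1 of layer 1
    // from neuron 2 of layer 0 is weights[1][1+4*2] = weights[1][9]; slots
    // outside the two layers' real sizes are allocated but never used.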

    /**
     * Get a reference to a bias.
     */
    inline double& getb(int layer,int neuron) const {
        return biases[layer][neuron];
    }

    /**
     * Get a reference to the average gradient for a given weight (see
     * getw() for the indexing scheme).
     */
    inline double& getavggradw(int tolayer,int toneuron,int fromneuron) const {
        return gradAvgsWeights[tolayer][toneuron+largestLayerSize*fromneuron];
    }

    /**
     * Get the value of a bias gradient.
     */
    inline double getavggradb(int l,int n) const {
        return gradAvgsBiases[l][n];
    }

    /**
     * Run a single example and calculate the errors; used in training.
     */
    void calcError(double *in,double *out){
        // first run the network forwards
        setInputs(in);
        update();

        // then calculate the error (delta) in the output layer
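        // For the logistic sigmoid with a squared-error cost, the output
        // delta is o*(1-o)*(o-t): o*(1-o) is the sigmoid derivative and
        // (o-t) the derivative of the cost with respect to the output.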
        int ol = numLayers-1;
        for(int i=0;i<layerSizes[ol];i++){
            double o = outputs[ol][i];
            errors[ol][i] = o*(1-o)*(o-out[i]);
        }

        // then work out the errors in all the other (hidden) layers
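        // Each hidden delta is built from the deltas of the layer above:
        //   delta[l][j] = (sum_i delta[l+1][i] * w(l+1,i,j)) * o*(1-o)
        // where o = outputs[l][j].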
        for(int l=1;l<numLayers-1;l++){
            for(int j=0;j<layerSizes[l];j++){
                double e = 0;
                for(int i=0;i<layerSizes[l+1];i++)
                    e += errors[l+1][i]*getw(l+1,i,j);

                // produce the \delta^l_j term, where l is the layer and j
                // the index of the node
                errors[l][j] = e * outputs[l][j] * (1-outputs[l][j]);
            }
        }
    }

    /**
     * Run a single update (forward pass) of the network.
     */
    virtual void update(){
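        // Each node j in layer i computes
        //   outputs[i][j] = sigmoid(biases[i][j] + sum_k w(i,j,k)*outputs[i-1][k]),
        // working forward from the first hidden layer to the output layer.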
        for(int i=1;i<numLayers;i++){
            for(int j=0;j<layerSizes[i];j++){
                double v = biases[i][j];
                for(int k=0;k<layerSizes[i-1];k++){
                    v += getw(i,j,k) * outputs[i-1][k];
                }
                outputs[i][j]=sigmoid(v);
            }
        }
    }

    /**
     * Train the network on a batch (or mini-batch, or a single example),
     * returning the mean error over the batch.
     */
    virtual double trainBatch(ExampleSet& ex,int start,int num,double eta){
        // zero the gradient accumulators
        for(int j=0;j<numLayers;j++){
            for(int k=0;k<layerSizes[j];k++)
                gradAvgsBiases[j][k]=0;
            for(int i=0;i<largestLayerSize*largestLayerSize;i++)
                gradAvgsWeights[j][i]=0;
        }

        // reset the total error
        double totalError=0;
        // iterate over the examples
        for(int nn=0;nn<num;nn++){
            int exampleIndex = nn+start;
            // set the modulator
            setH(ex.getH(exampleIndex));
            // get the desired outputs for this example
            double *outs = ex.getOutputs(exampleIndex);
            // run the example and calculate the error at each node
            calcError(ex.getInputs(exampleIndex),outs);

            // accumulate the gradients: dE/dw = delta * input activation
            for(int l=1;l<numLayers;l++){
                for(int i=0;i<layerSizes[l];i++){
                    for(int j=0;j<layerSizes[l-1];j++)
                        getavggradw(l,i,j) += errors[l][i]*outputs[l-1][j];
                    gradAvgsBiases[l][i] += errors[l][i];
                }
            }
            // add this example's squared output error to the total
            int ol = numLayers-1;
            for(int i=0;i<layerSizes[ol];i++){
                double o = outputs[ol][i];
                double e = (o-outs[i]);
                totalError += e*e;
            }
        }

        // for calculating averages: 1/(number of examples trained)
        double factor = 1.0/(double)num;
        // we now have a full set of summed gradients; time to apply them
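        // Gradient-descent step: each weight gets w -= eta * (1/num) * sum of
        // dE/dw over the batch (and likewise for each bias) - plain averaged
        // gradient descent, with no momentum term.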
        for(int l=1;l<numLayers;l++){
            for(int i=0;i<layerSizes[l];i++){
                for(int j=0;j<layerSizes[l-1];j++){
                    double wdelta = eta*getavggradw(l,i,j)*factor;
                    getw(l,i,j) -= wdelta;
                }
                double bdelta = eta*gradAvgsBiases[l][i]*factor;
                biases[l][i] -= bdelta;
            }
        }
        // return the summed squared output error, averaged over the
        // examples in the batch
        return totalError*factor;
    }
};

#endif /* __BPNET_HPP */
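
A minimal usage sketch (not part of the file above; the three-layer shape, buffer handling and main() are illustrative assumptions) showing construction and parameter serialisation through the public API:

    #include "bpnet.hpp"
    #include <vector>

    int main(){
        const int counts[] = {2,3,1};   // hypothetical shape: 2 inputs, 3 hidden, 1 output
        BPNet net(3,counts);            // NB: weights are not randomised by the ctor
        std::vector<double> buf(net.getDataSize());
        net.save(buf.data());           // serialise biases and weights...
        net.load(buf.data());           // ...and load them back
        return 0;
    }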