UESMANN CPP 1.0
Reference implementation of UESMANN
uesnet.hpp
#ifndef __UESNET_HPP
#define __UESNET_HPP

/**
 * The UESMANN network, which is itself based on the BPNet code, as it has
 * the same architecture as the plain net.
 */
class UESNet : public BPNet {
    /**
     * The modulator ("hormone") level, used in update() and calcError()
     * and applied during training.
     */
    double modulator;
public:
    /**
     * The constructor is mostly identical to the BPNet constructor.
     */
    UESNet(int nlayers, const int *layerCounts) : BPNet(nlayers, layerCounts),
        modulator(0)
    {
        // replace the net type, it's not a plain net any more

    }

    /**
     * Set the modulator level for subsequent runs and training of this network.
     */
    virtual void setH(double h){
        modulator = h;
    }

    /**
     * Get the modulator level.
     */
    virtual double getH() const {
        return modulator;
    }

protected:

    /**
     * Calculate the error (delta) for each node, given an example's
     * inputs and desired outputs.
     */
    void calcError(double *in, double *out){
        // first run the network forwards
        setInputs(in);
        update();

        // then calculate the error in the output layer.
        // This does the THIRD of the backprop equations, Eq. 4.15,
        // giving \delta^L_j.
        int ol = numLayers-1;
        for(int i=0;i<layerSizes[ol];i++){
            double o = outputs[ol][i];
            errors[ol][i] = o*(1-o)*(o-out[i]);
        }

        // then work out the errors in all the other layers,
        // factoring in (rather inefficiently) the hormone.
        // This is the FOURTH backprop equation, Eq. 4.16.
        for(int l=1;l<numLayers-1;l++){
            for(int j=0;j<layerSizes[l];j++){
                double e = 0;
                for(int i=0;i<layerSizes[l+1];i++)
                    e += errors[l+1][i]*getw(l+1,i,j);

                // produce the \delta^l_j term, where l is the layer and j
                // the index of the node. Here is where we factor in
                // the modulator.
                errors[l][j] = e * (modulator+1.0) * outputs[l][j] * (1-outputs[l][j]);
            }
        }
    }
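
    // For reference, a sketch of the error terms computed by calcError()
    // above, in the notation of the comments (t_i is the target output,
    // h the modulator):
    //
    //   output layer (Eq. 4.15):  \delta^L_i = o_i (1-o_i) (o_i - t_i)
    //   hidden layers (Eq. 4.16): \delta^l_j = (h+1) o_j (1-o_j)
    //                                        * sum_i( \delta^{l+1}_i w^{l+1}_{ij} )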

    /**
     * Run a single update of the network.
     */
    virtual void update(){
        double hfactor = modulator+1.0;
        for(int i=1;i<numLayers;i++){
            for(int j=0;j<layerSizes[i];j++){
                double v = 0.0;
                for(int k=0;k<layerSizes[i-1];k++){
                    v += getw(i,j,k) * outputs[i-1][k];
                }
                // factor in the hormone here
                outputs[i][j]=sigmoid(v*hfactor+biases[i][j]);
            }
        }
    }
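
    // For reference, the modulated forward pass computed by update() above:
    //
    //   o^l_j = sigmoid( (h+1) * sum_k( w^l_{jk} o^{l-1}_k ) + b^l_j )
    //
    // Note that the bias is added outside the (h+1) modulation.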

    /**
     * Train the network on a batch (or mini-batch, or a single example).
     * Returns the total error averaged over the batch.
     */
    virtual double trainBatch(ExampleSet& ex,int start,int num,double eta){
        // zero the average gradients
        for(int j=0;j<numLayers;j++){
            for(int k=0;k<layerSizes[j];k++)
                gradAvgsBiases[j][k]=0;
            for(int i=0;i<largestLayerSize*largestLayerSize;i++)
                gradAvgsWeights[j][i]=0;
        }

        // reset total error
        double totalError=0;
        // iterate over the examples
        for(int nn=0;nn<num;nn++){
            int exampleIndex = nn+start;
            // set the modulator from the example
            setH(ex.getH(exampleIndex));
            // get the desired outputs for this example
            double *outs = ex.getOutputs(exampleIndex);
            // build the errors for this example
            calcError(ex.getInputs(exampleIndex),outs);

            // accumulate the gradients
            for(int l=1;l<numLayers;l++){
                for(int i=0;i<layerSizes[l];i++){
                    // this does the FIRST of the backprop equations,
                    // Eq. 4.13, calculating dC/dw; the (h+1) modulator
                    // part of that equation is dealt with below.
                    for(int j=0;j<layerSizes[l-1];j++)
                        getavggradw(l,i,j) += errors[l][i]*outputs[l-1][j];
                    // this does the SECOND of the backprop equations,
                    // Eq. 4.14.
                    gradAvgsBiases[l][i] += errors[l][i];
                }
            }
            // count up the total error
            int ol = numLayers-1;
            for(int i=0;i<layerSizes[ol];i++){
                double o = outputs[ol][i];
                double e = (o-outs[i]);
                totalError += e*e;
            }
        }

        // get the modulator factor (this will be the h of the last
        // example in the batch)
        double hfactor = modulator+1.0;

        // for averaging the gradients - 1/(number of examples trained)
        double factor = 1.0/(double)num;
        // we now have a full set of summed gradients. Time to apply them.
        for(int l=1;l<numLayers;l++){
            for(int i=0;i<layerSizes[l];i++){
                for(int j=0;j<layerSizes[l-1];j++){
                    // this does the modulation part of Eq. 4.13, but a
                    // little later than in the thesis.
                    double wdelta = eta*getavggradw(l,i,j)*factor*hfactor;
                    // printf("WCORR: %f factor %f\n",wdelta,getavggradw(l,i,j));
                    getw(l,i,j) -= wdelta;
                }
                // biases are not modulated
                double bdelta = eta*gradAvgsBiases[l][i]*factor;
                biases[l][i] -= bdelta;
            }
        }
        // return the total error - the sum over outputs of each output's
        // squared error, averaged over the examples
        return totalError*factor;
    }
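
    // For reference, the update rule applied by trainBatch() above, where
    // N is the number of examples in the batch and eta the learning rate
    // (note that the single (h+1) factor comes from the last example's h):
    //
    //   w^l_{ij} -= eta * (h+1) * (1/N) * sum( \delta^l_i o^{l-1}_j )   (Eq. 4.13)
    //   b^l_i    -= eta * (1/N) * sum( \delta^l_i )                     (Eq. 4.14)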
};

#endif /* __UESNET_HPP */
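
A minimal usage sketch follows. It is not part of the header above: it assumes an ExampleSet named ex has already been constructed and filled (see data.hpp), uses numExamples as a hypothetical stand-in for its size, and picks an arbitrary 2-2-1 topology and learning rate. It also assumes that trainBatch() and update() are reachable through the public interface of the base class, since the overrides above are declared protected.

#include "uesnet.hpp"

void example(ExampleSet& ex, int numExamples) {
    // hypothetical 2-2-1 topology: two inputs, two hidden nodes, one output
    const int layerCounts[] = {2, 2, 1};
    UESNet net(3, layerCounts);

    // assumption: the training/run entry points are public on the base
    BPNet& base = net;

    // train: trainBatch() reads each example's h itself via setH(),
    // so the caller only supplies the range and the learning rate
    for(int i=0; i<1000; i++)
        base.trainBatch(ex, 0, numExamples, 0.1);   // full batch, eta=0.1

    // run the trained network at each extreme of the modulator
    double ins[2] = {1.0, 0.0};
    net.setInputs(ins);
    net.setH(0.0);   // behave as the h=0 function
    base.update();
    net.setH(1.0);   // behave as the h=1 function
    base.update();
}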