UESMANN CPP  1.0
Reference implementation of UESMANN
/home/travis/build/jimfinnis/uesmanncpp/net.hpp
Go to the documentation of this file.
1 
8 #ifndef __NET_HPP
9 #define __NET_HPP
10 
11 #include <math.h>
12 
13 #include "netType.hpp"
14 #include "data.hpp"
15 
/**
 * The logistic sigmoid activation function.
 * @param x input value
 * @return 1/(1+e^-x), a value in the open interval (0,1)
 */
inline double sigmoid(double x){
    double expNeg = exp(-x);
    return 1.0/(1.0+expNeg);
}
23 
28 inline double sigmoidDiff(double x){
29  double s = sigmoid(x);
30  return (1.0-s)*s;
31 }
32 
39 class Net {
40  friend class OutputBlendingNet;
41  friend class HInputNet;
42 public:
43 
47  virtual ~Net() {}
48 
50  drand48_data rd;
51 
    /**
     * Seed this network's private PRNG state (rd), which is used for
     * weight initialisation and shuffling. Uses the reentrant glibc
     * generator so each Net carries independent random state.
     * @param seed the seed value
     */
    void setSeed(long seed){
        srand48_r(seed,&rd);
    }
60 
65  virtual int getLayerSize(int n) const =0;
66 
70  virtual int getLayerCount() const =0;
71 
    /**
     * Get the number of inputs: the size of layer 0.
     * @return the input count
     */
    int getInputCount() const {
        return getLayerSize(0);
    }
78 
82  int getOutputCount() const {
83  return getLayerSize(getLayerCount()-1);
84  }
85 
86 
87 
93  virtual void setInputs(double *d) = 0;
94 
100  virtual double *getOutputs() const = 0;
101 
    /**
     * Run the network on some data: set the inputs, propagate with
     * update(), and return the resulting outputs.
     * @param in pointer to an array of getInputCount() doubles
     * @return pointer to the network's outputs
     *   (NOTE(review): buffer lifetime is presumably managed by the
     *   concrete subclass and valid until the next run — confirm)
     */
    double *run(double *in) {
        setInputs(in);
        update();
        return getOutputs();
    }
112 
117  virtual void setH(double h)=0;
118 
122  virtual double getH() const =0;
123 
142  double test(ExampleSet& examples,int start=0,int num=-1){
143  double mseSum = 0;
144  // have to do this here, too, although runExamples does it, so we can
145  // get the denominator for the mse.
146  if(num<0)num=examples.getCount()-start;
147 
148  // for each example, run it and accumulate the sum of squared errors
149  // on all outputs
150 
151  for(int i=0;i<num;i++){
152  int idx = start+i;
153  setH(examples.getH(idx));
154  double *netout = run(examples.getInputs(idx));
155  double *exout = examples.getOutputs(idx);
156  for(int j=0;j<examples.getOutputCount();j++){
157  double d = netout[j]-exout[j];
158  mseSum += d*d;
159  }
160  }
161 
162  // we then divide by the number of examples and the output count.
163  return mseSum / (num * examples.getOutputCount());
164  }
165 
173  struct SGDParams {
174  friend class Net;
175 
182 
186  double eta;
187 
188 
192  int nSlices;
193 
198 
204 
210  SGDParams& crossValidationManual(int slices,int nperslice,int interval){
211  nSlices = slices;
212  nPerSlice = nperslice;
213  cvInterval = interval;
214  return *this;
215  }
216 
222 
225  shuffleMode = m;
226  return *this;
227  }
228 
229 
230 
237 
240  selectBestWithCV=v;
241  return *this;
242  }
243 
244 
249  bool cvShuffle;
250 
        /**
         * Fluent setter for cvShuffle: whether to reshuffle the whole
         * CV set once every slice has been visited.
         * @param v the new value (defaults to true)
         * @return a reference to this, for call chaining
         */
        SGDParams& setCVShuffle(bool v=true){
            cvShuffle=v;
            return *this;
        }
256 
261 
        /**
         * Fluent setter for initrange: initial weights/biases are drawn
         * from [-range,range], or pass -1 to use the default rule.
         * @param range the new range, or -1 for the default
         * @return a reference to this, for call chaining
         */
        SGDParams& setInitRange(double range=-1){
            initrange = range;
            return *this;
        }
267 
272  long seed;
273 
        /**
         * Fluent setter for the PRNG seed used by trainSGD() for weight
         * initialisation and shuffling.
         * @param v the seed value
         * @return a reference to this, for call chaining
         */
        SGDParams& setSeed(long v){
            seed = v;
            return *this;
        }
279 
284  double *bestNetBuffer;
285 
290 
291  private:
        /**
         * Set every parameter to its default given the learning rate and
         * iteration count; called by both constructors.
         * @param _eta   the learning rate
         * @param _iters number of iterations (single-example presentations)
         */
        void init(double _eta,int _iters){
            seed = 0L;
            eta = _eta;
            iterations = _iters;
            initrange = -1;            // -1 selects the default weight-init rule
            bestNetBuffer = NULL;      // allocated lazily during training if needed
            ownsBestNetBuffer = false;
            storeBestNet = false;
            nSlices=0;                 // no cross-validation by default
            nPerSlice=0;
            cvInterval=1;
            shuffleMode = ExampleSet::STRIDE;
            selectBestWithCV=false; // there might not be CV!
            cvShuffle = true; // do shuffle CV at the end of an epoch
        }
313  public:
        /**
         * Constructor which sets up defaults with no information about the
         * examples; cross-validation is not set up (use crossValidation()
         * or crossValidationManual() afterwards if required).
         * @param _eta   the learning rate
         * @param _iters total number of iterations (example presentations)
         */
        SGDParams(double _eta, int _iters) {
            init(_eta,_iters);
        }
326 
        /**
         * Constructor taking an example set: the iteration count is given
         * in epochs, i.e. _iters * examples.getCount() presentations.
         * @param _eta     the learning rate
         * @param examples the training set (used only for its count)
         * @param _iters   number of epochs
         */
        SGDParams(double _eta,const ExampleSet& examples,int _iters){
            init(_eta,examples.getCount()*_iters);
        }
335 
341  if(ownsBestNetBuffer)delete[] bestNetBuffer;
342  }
343 
357  double propCV,
358  int cvCount,
359  int cvSlices,
360  bool cvShuf=true
361  ){
362  cvShuffle = cvShuf;
363  // calculate the number of CV examples
364  int nCV = (int)round(propCV*examples.getCount());
365  if(nCV==0 || nCV>examples.getCount())
366  throw std::out_of_range("Bad cross-validation count");
367  if(cvSlices<=0)
368  throw std::out_of_range("Zero (or fewer) CV slices is a bad thing");
369  // calculate the number of examples per slice and check it's not zero.
370  // The resulting number of CV examples may not agree with nCV above due
371  // to the integer division
372  nPerSlice = nCV/cvSlices;
373  nSlices = cvSlices;
374  if(!nPerSlice)
375  throw std::logic_error("Too many slices");
376  // calculate the cvInterval
377  cvInterval = iterations/cvCount;
378  if(cvInterval<=0)
379  throw std::logic_error("Too many CV events");
380  // we want to pick the best network by CV rather than training error
381  selectBestWithCV=true;
382 
383  printf("Cross-validation: %d slices, %d items per slice, %d total\n",
384  nSlices,nPerSlice,nSlices*nPerSlice);
385  return *this;
386  }
387 
395  ownsBestNetBuffer = true;
396  storeBestNet = true;
397  return *this;
398  }
399  private:
404  bool ownsBestNetBuffer;
405  };
406 
407 
408 
428  double trainSGD(ExampleSet &examples,SGDParams& params){
429 
430  // set seed for PRNG
431  setSeed(params.seed);
432 
433  // separate out the training examples from the cross-validation examples
434  int nCV = params.nSlices*params.nPerSlice;
435  // it's an error if there are too many CV examples
436  if(nCV>=examples.getCount())
437  throw std::out_of_range("Too many cross-validation examples");
438 
439  if(!nCV && params.selectBestWithCV)
440  throw std::logic_error("cannot use CV to select best when no CV is done");
441 
442  // get the number of actual training examples
443  int nExamples = examples.getCount() - nCV;
444 
445  // initialise the network
446  initWeights(params.initrange);
447 
448  // initialise minimum error to rogue value
449  double minError = -1;
450 
451  // We don't shuffle before getting the cross-validation examples,
452  // because in some cases there's a kind of "fake" cv going on where the
453  // training portion and cv portion have to have similar (or identical)
454  // distributions. See the boolean test code for an example.
455  // examples.shuffle(&rd,params.shuffleMode);
456 
457  // build a temporary subset for the CV examples. This still needs to exist
458  // even if we're not using CV, so in that case we'll just
459  // use a dummy of one example.
460 
461  ExampleSet cvExamples(examples,nCV?examples.getCount()-nCV:0,nCV?nCV:1);
462 
463 
464  // setup a countdown for when we cross-validate
465  int cvCountdown = params.cvInterval;
466  // and which slice we are doing
467  int cvSlice = 0;
468 
469  // now actually do the training
470 
471  FILE *log = fopen("foo","w");
472  fprintf(log,"x,slice,y\n");
473  for(int i=0;i<params.iterations;i++){
474  // find the example number
475  int exampleIndex = i % nExamples;
476 
477  // at the start of each epoch, reshuffle. This will effectively do an extra shuffle
478  // as we've already done it once at the start, before splitting out the CV examples.
479 
480  if(exampleIndex == 0)
481  examples.shuffle(&rd,params.shuffleMode,nExamples);
482 
483  // train here, just one example, no batching.
484  double trainingError = trainBatch(examples,exampleIndex,1,params.eta);
485 
486  if(!params.selectBestWithCV){
487  // now test the error and keep the best net. This works differently
488  // if we're doing this by cross-validation or training error. Here
489  // we're using the training error.
490  if(minError < 0 || trainingError < minError){
491  if(params.storeBestNet){
492  if(!params.bestNetBuffer)
493  params.bestNetBuffer = new double[getDataSize()];
494  save(params.bestNetBuffer);
495  }
496  minError = trainingError;
497  }
498  }
499 
500  // is there cross-validation? If so, do it.
501 
502  if(nCV && !--cvCountdown){
503  cvCountdown = params.cvInterval; // reset
504 
505  // test the appropriate slice, from example cvSlice*nPerSlice, length nPerSlice,
506  // and get the MSE
507  double error = test(cvExamples,cvSlice*params.nPerSlice,
508  params.nPerSlice);
509  fprintf(log,"%d,%d,%f\n",i,cvSlice,error);
510 
511  // test this against the min error as was done above
512  if(params.selectBestWithCV){
513  if(minError < 0 || trainingError < minError){
514  if(params.storeBestNet){
515  if(!params.bestNetBuffer)
516  params.bestNetBuffer = new double[getDataSize()];
517  save(params.bestNetBuffer);
518  }
519  minError = trainingError;
520  }
521  }
522 
523  // increment the slice index
524  cvSlice = (cvSlice+1)%params.nSlices;
525  // if we are now on the first slice, shuffle the entire CV set
526  if(!cvSlice && params.cvShuffle)
527  cvExamples.shuffle(&rd,params.shuffleMode);
528  }
529  }
530 
531  fclose(log);
532 
533  // at the end, finalise the network to the best found if we can
534  if(params.bestNetBuffer)
535  load(params.bestNetBuffer);
536 
537  // test on either the entire CV set or the training set and return result
538  return test(nCV?cvExamples:examples);
539  }
540 
546  virtual int getDataSize() const = 0;
547 
553  virtual void save(double *buf) const = 0;
554 
561  virtual void load(double *buf) = 0;
562 
563 protected:
564 
565 
566 
573  virtual void update() = 0;
574 
581  type = tp;
582  setSeed(0);
583  }
584 
591  inline double drand(double mn,double mx){
592  double res;
593  drand48_r(&rd,&res);
594  return res*(mx-mn)+mn;
595  }
596 
602  virtual void initWeights(double initr) = 0;
603 
634  virtual double trainBatch(ExampleSet& ex,int start,int num,double eta) = 0;
635 
636 };
637 
638 
639 #endif /* __NET_HPP */
int getCount() const
get the number of examples
Definition: data.hpp:327
Contains integer enum for network types.
NetType
The different types of network - each has an associated integer for saving/loading file data...
Definition: netType.hpp:15
SGDParams & setInitRange(double range=-1)
fluent setter for initrange
Definition: net.hpp:263
int initrange
range of initial weights/biases [-n,n], or -1 for Bishop's rule.
Definition: net.hpp:260
virtual int getLayerCount() const =0
Get the number of layers.
double eta
Definition: net.hpp:186
SGDParams & crossValidationManual(int slices, int nperslice, int interval)
fluent setter for cross-validation parameters manually; consider using crossValidation instead ...
Definition: net.hpp:210
SGDParams & setSelectBestWithCV(bool v=true)
fluent setter for selectBestWithCV
Definition: net.hpp:239
A modulatory network architecture which uses two plain backprop networks, each of which is trained se...
Definition: obnet.hpp:18
Training parameters for trainSGD(). This structure holds the parameters for the trainSGD() method...
Definition: net.hpp:173
ShuffleMode
Shuffling mode for shuffle()
Definition: data.hpp:212
SGDParams & crossValidation(const ExampleSet &examples, double propCV, int cvCount, int cvSlices, bool cvShuf=true)
Set up the cross-validation parameters given the full training set, the proportion to be used for CV...
Definition: net.hpp:356
SGDParams(double _eta, int _iters)
Constructor which sets up defaults with no information about examples - cross-validation is not set u...
Definition: net.hpp:323
int getInputCount() const
get the number of inputs
Definition: net.hpp:75
virtual void save(double *buf) const =0
Serialize the data (not including any network type magic number or layer/node counts) to the given me...
A modulatory network architecture which uses a plain backprop network with an extra input to carry th...
Definition: hinet.hpp:17
double trainSGD(ExampleSet &examples, SGDParams &params)
Train using stochastic gradient descent. Note that cross-validation parameters are slightly different...
Definition: net.hpp:428
virtual void setH(double h)=0
Set the modulator level for subsequent runs and training of this network.
int getOutputCount() const
get the number of outputs
Definition: net.hpp:82
double sigmoidDiff(double x)
Definition: net.hpp:28
double * getOutputs(int example)
Get a pointer to the outputs for a given example, for reading or writing.
Definition: data.hpp:349
int cvInterval
how often to cross-validate given as the interval between CV events: 1 is every iteration, 2 is every other iteration and so on.
Definition: net.hpp:203
virtual double getH() const =0
get the modulator level
virtual double * getOutputs() const =0
Get the outputs after running.
double sigmoid(double x)
Definition: net.hpp:20
int nPerSlice
the number of example per cross-validation slice
Definition: net.hpp:197
void shuffle(drand48_data *rd, ShuffleMode mode, int nExamples=0)
Shuffle the example using a PRNG and a Fisher-Yates shuffle.
Definition: data.hpp:259
SGDParams & storeBest()
set up a "best net buffer" to store the best network found, to which the network will be set on compl...
Definition: net.hpp:394
bool storeBestNet
true if we should store the best net data
Definition: net.hpp:289
Contains formats for example data.
virtual void setInputs(double *d)=0
Set the inputs to the network before running or training.
double * bestNetBuffer
a buffer of at least getDataSize() bytes for the best network. If NULL, the best network is not saved...
Definition: net.hpp:284
virtual int getLayerSize(int n) const =0
Get the number of nodes in a given layer.
Net(NetType tp)
Constructor - protected because others inherit it and it's not used directly.
Definition: net.hpp:580
Shuffle blocks of numHLevels examples, rather than single examples. This is intended for cases where ...
Definition: data.hpp:228
SGDParams & setCVShuffle(bool v=true)
fluent setter for cvShuffle
Definition: net.hpp:252
virtual ~Net()
virtual destructor which does nothing
Definition: net.hpp:47
SGDParams & setSeed(long v)
fluent setter for seed
Definition: net.hpp:275
bool selectBestWithCV
if true, use the minimum CV error to find the best net, otherwise use the training error...
Definition: net.hpp:236
double * run(double *in)
Run the network on some data.
Definition: net.hpp:107
int getOutputCount() const
get the number of outputs in all examples
Definition: data.hpp:319
virtual void initWeights(double initr)=0
initialise weights to random values
virtual double trainBatch(ExampleSet &ex, int start, int num, double eta)=0
Train a network for batch (or mini-batch) (or single example).
virtual void update()=0
Run a single update of the network.
long seed
seed for random number generator used to initialise weights and also perform shuffling ...
Definition: net.hpp:272
virtual int getDataSize() const =0
Get the length of the serialised data block for this network.
virtual void load(double *buf)=0
Given that the pointer points to a data block of the correct size for the current network...
int iterations
number of iterations to run: an iteration is the presentation of a single example, NOT an epoch (or occasionally pair-presentation) as is the case in the thesis when discussing the modulatory network types.
Definition: net.hpp:181
int nSlices
The number of cross-validation slices to use.
Definition: net.hpp:192
NetType type
type of the network, used for load/save
Definition: net.hpp:49
drand48_data rd
PRNG data (thread safe)
Definition: net.hpp:50
SGDParams & setShuffle(ExampleSet::ShuffleMode m)
fluent setter for preserveHAlternation
Definition: net.hpp:224
bool cvShuffle
if true, shuffle the entire CV data set when all slices have been done so that the cross-validation h...
Definition: net.hpp:249
SGDParams(double _eta, const ExampleSet &examples, int _iters)
Definition: net.hpp:332
void setSeed(long seed)
Set this network's random number generator, which is used for weight initialisation done at the start...
Definition: net.hpp:57
double getH(int example) const
Get the h (modulator) for a given example.
Definition: data.hpp:359
~SGDParams()
Destructor.
Definition: net.hpp:340
double test(ExampleSet &examples, int start=0, int num=-1)
Test a network. Runs the network over a set of examples and returns the mean MSE for all outputs whe...
Definition: net.hpp:142
The abstract network type upon which all others are based. It's not pure virtual, in that it encapsul...
Definition: net.hpp:39
double * getInputs(int example)
Get a pointer to the inputs for a given example, for reading or writing.
Definition: data.hpp:338
double drand(double mn, double mx)
get a random number using this net&#39;s PRNG data
Definition: net.hpp:591
A set of example data. Each datum consists of hormone (i.e. modulator value), inputs and outputs...
Definition: data.hpp:57
ExampleSet::ShuffleMode shuffleMode
The shuffle mode to use - see the ExampleSet::ShuffleMode enum for details.
Definition: net.hpp:221