rootdoc/html/TMultiLayerPerceptron_8h_source.html

 // @(#)root/mlp:$Id$
 // Author: Christophe.Delaere@cern.ch   20/07/03

 /*************************************************************************
  * Copyright (C) 1995-2003, Rene Brun and Fons Rademakers.               *
  * All rights reserved.                                                  *
  *                                                                       *
  * For the licensing terms see $ROOTSYS/LICENSE.                         *
  * For the list of contributors see $ROOTSYS/README/CREDITS.             *
  *************************************************************************/

 #ifndef ROOT_TMultiLayerPerceptron
 #define ROOT_TMultiLayerPerceptron

 #include "TObject.h"
 #include "TString.h"
 #include "TObjArray.h"
 #include "TMatrixD.h"
 #include "TNeuron.h"

 class TTree;
 class TEventList;
 class TTreeFormula;
 class TTreeFormulaManager;

 //____________________________________________________________________
 //
 // TMultiLayerPerceptron
 //
 // This class describes a Neural network.
 // There are facilities to train the network and use the output.
 //
 // The input layer is made of inactive neurons (returning the
 // normalized input), hidden layers are made of sigmoids and output
 // neurons are linear.
 //
 // The basic input is a TTree and two (training and test) TEventLists.
 // For classification jobs, a branch (maybe in a TFriend) must contain
 // the expected output.
 // 6 learning methods are available: kStochastic, kBatch,
 // kSteepestDescent, kRibierePolak, kFletcherReeves and kBFGS.
 //
 // This implementation is *inspired* from the mlpfit package from
 // J.Schwindling et al.
 //
 //____________________________________________________________________

 // Neural network (multi-layer perceptron) fed from a TTree, with separate
 // training and test event selections. Copying is disabled: the copy
 // constructor and assignment operator are declared private and not implemented.
 class TMultiLayerPerceptron : public TObject {
  // TMLPAnalyzer is granted access to the protected/private members.
  friend class TMLPAnalyzer;

  public:
    // Learning methods selectable through SetLearningMethod().
    enum ELearningMethod { kStochastic, kBatch, kSteepestDescent,
                           kRibierePolak, kFletcherReeves, kBFGS };
    // Selects which dataset GetError(EDataSet) refers to.
    enum EDataSet { kTraining, kTest };

    // Default constructor.
    TMultiLayerPerceptron();
    // The four constructors below differ in two ways:
    //  - the training/test datasets are given either as selection strings
    //    (const char*) or as TEventList pointers;
    //  - an optional event-weight string ("weight") may follow the layout.
    // "type" is the neuron type (defaults to TNeuron::kSigmoid); "extF"/"extD"
    // are stored as a function name and a derivative name (see fextF/fextD).
    TMultiLayerPerceptron(const char* layout, TTree* data = 0,
                          const char* training = "Entry$%2==0",
                          const char* test = "",
                          TNeuron::ENeuronType type = TNeuron::kSigmoid,
                          const char* extF = "", const char* extD  = "");
    TMultiLayerPerceptron(const char* layout,
                          const char* weight, TTree* data = 0,
                          const char* training = "Entry$%2==0",
                          const char* test = "",
                          TNeuron::ENeuronType type = TNeuron::kSigmoid,
                          const char* extF = "", const char* extD  = "");
    TMultiLayerPerceptron(const char* layout, TTree* data,
                          TEventList* training,
                          TEventList* test,
                          TNeuron::ENeuronType type = TNeuron::kSigmoid,
                          const char* extF = "", const char* extD  = "");
    TMultiLayerPerceptron(const char* layout,
                          const char* weight, TTree* data,
                          TEventList* training,
                          TEventList* test,
                          TNeuron::ENeuronType type = TNeuron::kSigmoid,
                          const char* extF = "", const char* extD  = "");
    virtual ~TMultiLayerPerceptron();

    // --- Data source and dataset configuration ---
    // Set the data source.
    void SetData(TTree*);
    // Set the training / test dataset, either from an existing TEventList
    // or from a string (const char* overloads).
    void SetTrainingDataSet(TEventList* train);
    void SetTestDataSet(TEventList* test);
    void SetTrainingDataSet(const char* train);
    void SetTestDataSet(const char* test);
    // Set the learning method.
    void SetLearningMethod(TMultiLayerPerceptron::ELearningMethod method);
    // Set the event weight.
    void SetEventWeight(const char*);

    // --- Training and evaluation ---
    // Train the network for nEpoch epochs.
    // NOTE(review): minE is presumably an error threshold that stops training
    // early - confirm against the implementation.
    void Train(Int_t nEpoch, Option_t* option = "text", Double_t minE=0);
    // Computes the output (of output neuron "index") for a given event.
    Double_t Result(Int_t event, Int_t index = 0) const;
    // Error on the output for a given event.
    Double_t GetError(Int_t event) const;
    // Error for the selected dataset (kTraining or kTest).
    Double_t GetError(TMultiLayerPerceptron::EDataSet set) const;
    // Compute DEDw: sum over all training events of dedw for each weight.
    void ComputeDEDw() const;
    // Randomize the weights.
    void Randomize() const;

    // --- Learning parameters (see the data members below for defaults) ---
    void SetEta(Double_t eta);         // used in stochastic minimisation
    void SetEpsilon(Double_t eps);     // used in stochastic minimisation
    void SetDelta(Double_t delta);     // used in stochastic minimisation
    void SetEtaDecay(Double_t ed);     // Eta *= EtaDecay at each epoch
    void SetTau(Double_t tau);         // used in line search
    // Number of epochs between two resets of the search direction to the
    // steepest descent.
    void SetReset(Int_t reset);
    inline Double_t GetEta()      const { return fEta; }
    inline Double_t GetEpsilon()  const { return fEpsilon; }
    inline Double_t GetDelta()    const { return fDelta; }
    inline Double_t GetEtaDecay() const { return fEtaDecay; }
    TMultiLayerPerceptron::ELearningMethod GetLearningMethod() const { return fLearningMethod; }
    inline Double_t GetTau()      const { return fTau; }
    inline Int_t GetReset()       const { return fReset; }
    // Returns a copy of the network structure string.
    inline TString GetStructure() const { return fStructure; }
    // Returns the type of the hidden neurons.
    inline TNeuron::ENeuronType GetType() const { return fType; }

    // --- Output, persistence and export ---
    // Draws the neural net output for output neuron "index".
    void DrawResult(Int_t index = 0, Option_t* option = "test") const;
    // Dumps the weights to a text file.
    Bool_t DumpWeights(Option_t* filename = "-") const;
    // Loads the weights from a text file in the format written by DumpWeights.
    Bool_t LoadWeights(Option_t* filename = "");
    // Returns the network output "index" for a given set of input parameters;
    // the number of parameters must equal the number of input neurons.
    Double_t Evaluate(Int_t index, Double_t* params) const;
    // Exports the network as a standalone function.
    void Export(Option_t* filename = "NNfunction", Option_t* language = "C++") const;
    // Draws the network structure.
    virtual void Draw(Option_t *option="");

  protected:
    // Connects the TTree to the neurons in the input and output layers.
    void AttachData();
    // Instantiates the network from the description.
    void BuildNetwork();
    // Load an entry into the network.
    void GetEntry(Int_t) const;
    // it's a choice not to force learning function being const, even if possible
    // One step of the stochastic method; the buffer should contain the
    // previous dw vector and will be updated.
    void MLP_Stochastic(Double_t*);
    // One step of the batch method.
    void MLP_Batch(Double_t*);
    // Search along the line defined by the direction.
    Bool_t LineSearch(Double_t*, Double_t*);
    // Sets the search direction to steepest descent.
    void SteepestDir(Double_t*);
    // Sets the search direction to the conjugate gradient direction.
    void ConjugateGradientsDir(Double_t*, Double_t);
    // Sets the gamma (g_{(t+1)}-g_{(t)}) and delta (w_{(t+1)}-w_{(t)}) vectors.
    void SetGammaDelta(TMatrixD&, TMatrixD&, Double_t*);
    // Computes the hessian matrix using the BFGS update algorithm.
    bool GetBFGSH(TMatrixD&, TMatrixD &, TMatrixD&);
    // Computes the direction for the BFGS algorithm from the Hessian estimate.
    void BFGSDir(TMatrixD&, Double_t*);
    // Scalar product between gradient and direction = derivative along direction.
    Double_t DerivDir(Double_t*);
    // Cross entropy error for sigmoid output neurons, for a given event.
    Double_t GetCrossEntropyBinary() const;
    // Cross entropy error for a softmax output neuron, for a given event.
    Double_t GetCrossEntropy() const;
    // Error on the output for a given event.
    Double_t GetSumSquareError() const;

  private:
    TMultiLayerPerceptron(const TMultiLayerPerceptron&); // Not implemented
    TMultiLayerPerceptron& operator=(const TMultiLayerPerceptron&); // Not implemented
    // Expand the structure of the first layer.
    void ExpandStructure();
    // Instantiates the input neurons.
    void BuildFirstLayer(TString&);
    // Builds hidden layers.
    void BuildHiddenLayers(TString&);
    // Builds a hidden layer, updates the number of layers.
    void BuildOneHiddenLayer(const TString& sNumNodes, Int_t& layer,
                             Int_t& prevStart, Int_t& prevStop,
                             Bool_t lastLayer);
    // Builds the output layer.
    void BuildLastLayer(TString&, Int_t);
    // Shuffle the Int_t index[n] in input.
    void Shuffle(Int_t*, Int_t) const;
    // Sets the weights to a point along a line: [origin + (dist * dir)].
    void MLP_Line(Double_t*, Double_t*, Double_t);

    // Data members. NOTE(review): the trailing comments are presumably read by
    // ROOT's dictionary generator (a comment beginning with '!' conventionally
    // marks a member as not persistent) - keep them on the same line as the
    // member and do not reword the leading marker without confirming.
    TTree* fData;                   //! pointer to the tree used as datasource
    Int_t fCurrentTree;             //! index of the current tree in a chain
    Double_t fCurrentTreeWeight;    //! weight of the current tree in a chain
    TObjArray fNetwork;             // Collection of all the neurons in the network
    TObjArray fFirstLayer;          // Collection of the input neurons; subset of fNetwork
    TObjArray fLastLayer;           // Collection of the output neurons; subset of fNetwork
    TObjArray fSynapses;            // Collection of all the synapses in the network
    TString fStructure;             // String containing the network structure
    TString fWeight;                // String containing the event weight
    TNeuron::ENeuronType fType;     // Type of hidden neurons
    TNeuron::ENeuronType fOutType;  // Type of output neurons
    TString fextF;                  // String containing the function name
    TString fextD;                  // String containing the derivative name
    TEventList *fTraining;          //! EventList defining the events in the training dataset
    TEventList *fTest;              //! EventList defining the events in the test dataset
    ELearningMethod fLearningMethod; //! The Learning Method
    TTreeFormula* fEventWeight;     //! formula representing the event weight
    TTreeFormulaManager* fManager;  //! TTreeFormulaManager for the weight and neurons
    Double_t fEta;                  //! Eta - used in stochastic minimisation - Default=0.1
    Double_t fEpsilon;              //! Epsilon - used in stochastic minimisation - Default=0.
    Double_t fDelta;                //! Delta - used in stochastic minimisation - Default=0.
    Double_t fEtaDecay;             //! EtaDecay - Eta *= EtaDecay at each epoch - Default=1.
    Double_t fTau;                  //! Tau - used in line search - Default=3.
    Double_t fLastAlpha;            //! internal parameter used in line search
    Int_t fReset;                   //! number of epochs between two resets of the search direction to the steepest descent - Default=50
    Bool_t fTrainingOwner;          //! internal flag whether one has to delete fTraining or not
    Bool_t fTestOwner;              //! internal flag whether one has to delete fTest or not
    ClassDef(TMultiLayerPerceptron, 4) // a Neural Network
 };

 #endif
TMultiLayerPerceptron::DerivDir
Double_t DerivDir(Double_t *)
scalar product between gradient and direction = derivative along direction
Definition: TMultiLayerPerceptron.cxx:2415

TMultiLayerPerceptron::kStochastic
Definition: TMultiLayerPerceptron.h:52

TMultiLayerPerceptron
Definition: TMultiLayerPerceptron.h:48

TMultiLayerPerceptron::fFirstLayer
TObjArray fFirstLayer
Definition: TMultiLayerPerceptron.h:149

TMultiLayerPerceptron::LineSearch
Bool_t LineSearch(Double_t *, Double_t *)
Search along the line defined by direction.
Definition: TMultiLayerPerceptron.cxx:2221

TMultiLayerPerceptron::SteepestDir
void SteepestDir(Double_t *)
Sets the search direction to steepest descent.
Definition: TMultiLayerPerceptron.cxx:2200

TMultiLayerPerceptron::Randomize
void Randomize() const
Randomize the weights.
Definition: TMultiLayerPerceptron.cxx:1189

TMultiLayerPerceptron::BuildHiddenLayers
void BuildHiddenLayers(TString &)
Builds hidden layers.
Definition: TMultiLayerPerceptron.cxx:1369

TNeuron.h

TMultiLayerPerceptron::BFGSDir
void BFGSDir(TMatrixD &, Double_t *)
Computes the direction for the BFGS algorithm as the product between the Hessian estimate (bfgsh) and...
Definition: TMultiLayerPerceptron.cxx:2439

TMultiLayerPerceptron::fEpsilon
Double_t fEpsilon
Epsilon - used in stochastic minimisation - Default=0.
Definition: TMultiLayerPerceptron.h:164

TMultiLayerPerceptron::fManager
TTreeFormulaManager * fManager
TTreeFormulaManager for the weight and neurons.
Definition: TMultiLayerPerceptron.h:162

TMultiLayerPerceptron::ELearningMethod
ELearningMethod
Definition: TMultiLayerPerceptron.h:52

TMultiLayerPerceptron::fData
TTree * fData
Definition: TMultiLayerPerceptron.h:145

TMultiLayerPerceptron::SetTestDataSet
void SetTestDataSet(TEventList *test)
Sets the Test dataset.
Definition: TMultiLayerPerceptron.cxx:589

TMultiLayerPerceptron::kTest
Definition: TMultiLayerPerceptron.h:54

TMultiLayerPerceptron::GetEpsilon
Double_t GetEpsilon() const
Definition: TMultiLayerPerceptron.h:99

TMultiLayerPerceptron::fCurrentTreeWeight
Double_t fCurrentTreeWeight
weight of the current tree in a chain
Definition: TMultiLayerPerceptron.h:147

TMultiLayerPerceptron::SetEpsilon
void SetEpsilon(Double_t eps)
Sets Epsilon - used in stochastic minimisation (look at the constructor for the complete description ...
Definition: TMultiLayerPerceptron.cxx:660

TMultiLayerPerceptron::Export
void Export(Option_t *filename="NNfunction", Option_t *language="C++") const
Exports the NN as a function for any non-ROOT-dependent code. Supported languages are: only C++ ...
Definition: TMultiLayerPerceptron.cxx:1688

TMultiLayerPerceptron::Evaluate
Double_t Evaluate(Int_t index, Double_t *params) const
Returns the Neural Net for a given set of input parameters #parameters must equal #input neurons...
Definition: TMultiLayerPerceptron.cxx:1663

TNeuron::ENeuronType
ENeuronType
Definition: TNeuron.h:48

TMultiLayerPerceptron::AttachData
void AttachData()
Connects the TTree to Neurons in input and output layers.
Definition: TMultiLayerPerceptron.cxx:1216

TMultiLayerPerceptron::SetEtaDecay
void SetEtaDecay(Double_t ed)
Sets EtaDecay - Eta *= EtaDecay at each epoch (look at the constructor for the complete description o...
Definition: TMultiLayerPerceptron.cxx:680

TMultiLayerPerceptron::kSteepestDescent
Definition: TMultiLayerPerceptron.h:52

TMultiLayerPerceptron::SetEta
void SetEta(Double_t eta)
Sets Eta - used in stochastic minimisation (look at the constructor for the complete description of l...
Definition: TMultiLayerPerceptron.cxx:650

TMultiLayerPerceptron::GetEta
Double_t GetEta() const
Definition: TMultiLayerPerceptron.h:98

TMultiLayerPerceptron::GetLearningMethod
TMultiLayerPerceptron::ELearningMethod GetLearningMethod() const
Definition: TMultiLayerPerceptron.h:102

TMultiLayerPerceptron::SetData
void SetData(TTree *)
Set the data source.
Definition: TMultiLayerPerceptron.cxx:546

TNeuron::kSigmoid
Definition: TNeuron.h:48

TMultiLayerPerceptron::Shuffle
void Shuffle(Int_t *, Int_t) const
Shuffle the Int_t index[n] in input.
Definition: TMultiLayerPerceptron.cxx:2086

TMultiLayerPerceptron::GetSumSquareError
Double_t GetSumSquareError() const
Error on the output for a given event.
Definition: TMultiLayerPerceptron.cxx:1048

TMultiLayerPerceptron::fNetwork
TObjArray fNetwork
Collection of all the neurons in the network
Definition: TMultiLayerPerceptron.h:148

TMultiLayerPerceptron::GetTau
Double_t GetTau() const
Definition: TMultiLayerPerceptron.h:103

TMLPAnalyzer
Definition: TMLPAnalyzer.h:36

TMatrixT< Double_t >

TMultiLayerPerceptron::ConjugateGradientsDir
void ConjugateGradientsDir(Double_t *, Double_t)
Sets the search direction to conjugate gradient direction beta should be: ||g_{(t+1)}||^2 / ||g_{(t)}...
Definition: TMultiLayerPerceptron.cxx:2324

TMultiLayerPerceptron::DrawResult
void DrawResult(Int_t index=0, Option_t *option="test") const
Draws the neural net output. It produces a histogram with the output for the two datasets.
Definition: TMultiLayerPerceptron.cxx:1483

TMultiLayerPerceptron::GetBFGSH
bool GetBFGSH(TMatrixD &, TMatrixD &, TMatrixD &)
Computes the hessian matrix using the BFGS update algorithm.
Definition: TMultiLayerPerceptron.cxx:2350

TMultiLayerPerceptron::fEta
Double_t fEta
Eta - used in stochastic minimisation - Default=0.1.
Definition: TMultiLayerPerceptron.h:163

tau
you should not use this method at all Int_t Int_t Double_t Double_t Double_t Int_t Double_t Double_t Double_t tau
Definition: TRolke.cxx:630

TMultiLayerPerceptron::fextF
TString fextF
Definition: TMultiLayerPerceptron.h:156

TMultiLayerPerceptron::operator=
TMultiLayerPerceptron & operator=(const TMultiLayerPerceptron &)

TMultiLayerPerceptron::~TMultiLayerPerceptron
virtual ~TMultiLayerPerceptron()
Destructor.
Definition: TMultiLayerPerceptron.cxx:537

TMultiLayerPerceptron::SetReset
void SetReset(Int_t reset)
Sets number of epochs between two resets of the search direction to the steepest descent.
Definition: TMultiLayerPerceptron.cxx:701

TMultiLayerPerceptron::DumpWeights
Bool_t DumpWeights(Option_t *filename="-") const
Dumps the weights to a text file.
Definition: TMultiLayerPerceptron.cxx:1557

TMultiLayerPerceptron::fCurrentTree
Int_t fCurrentTree
index of the current tree in a chain
Definition: TMultiLayerPerceptron.h:146

TMultiLayerPerceptron::fType
TNeuron::ENeuronType fType
Definition: TMultiLayerPerceptron.h:154

TMultiLayerPerceptron::fSynapses
TObjArray fSynapses
Definition: TMultiLayerPerceptron.h:151

TMultiLayerPerceptron::fTraining
TEventList * fTraining
Definition: TMultiLayerPerceptron.h:158

TMultiLayerPerceptron::BuildOneHiddenLayer
void BuildOneHiddenLayer(const TString &sNumNodes, Int_t &layer, Int_t &prevStart, Int_t &prevStop, Bool_t lastLayer)
Builds a hidden layer, updates the number of layers.
Definition: TMultiLayerPerceptron.cxx:1388

TMultiLayerPerceptron::Train
void Train(Int_t nEpoch, Option_t *option="text", Double_t minE=0)
Train the network.
Definition: TMultiLayerPerceptron.cxx:738

TMultiLayerPerceptron::fOutType
TNeuron::ENeuronType fOutType
Definition: TMultiLayerPerceptron.h:155

TMultiLayerPerceptron::Draw
virtual void Draw(Option_t *option="")
Draws the network structure.
Definition: TMultiLayerPerceptron.cxx:2469

TMultiLayerPerceptron::fTestOwner
Bool_t fTestOwner
internal flag whether one has to delete fTest or not
Definition: TMultiLayerPerceptron.h:171

TMultiLayerPerceptron::GetError
Double_t GetError(Int_t event) const
Error on the output for a given event.
Definition: TMultiLayerPerceptron.cxx:996

TMultiLayerPerceptron::LoadWeights
Bool_t LoadWeights(Option_t *filename="")
Loads the weights from a text file conforming to the format defined by DumpWeights.
Definition: TMultiLayerPerceptron.cxx:1607

TMultiLayerPerceptron::fReset
Int_t fReset
number of epochs between two resets of the search direction to the steepest descent - Default=50
Definition: TMultiLayerPerceptron.h:169

TMultiLayerPerceptron::SetTrainingDataSet
void SetTrainingDataSet(TEventList *train)
Sets the Training dataset.
Definition: TMultiLayerPerceptron.cxx:578

TMultiLayerPerceptron::kBatch
Definition: TMultiLayerPerceptron.h:52

TMultiLayerPerceptron::GetReset
Int_t GetReset() const
Definition: TMultiLayerPerceptron.h:104

TMultiLayerPerceptron::SetGammaDelta
void SetGammaDelta(TMatrixD &, TMatrixD &, Double_t *)
Sets the gamma (g_{(t+1)}-g_{(t)}) and delta (w_{(t+1)}-w_{(t)}) vectors Gamma is computed here...
Definition: TMultiLayerPerceptron.cxx:2376

TMultiLayerPerceptron::ComputeDEDw
void ComputeDEDw() const
Compute the DEDw = sum on all training events of dedw for each weight normalized by the number of eve...
Definition: TMultiLayerPerceptron.cxx:1113

TMultiLayerPerceptron::kRibierePolak
Definition: TMultiLayerPerceptron.h:53

TMultiLayerPerceptron::fEtaDecay
Double_t fEtaDecay
EtaDecay - Eta *= EtaDecay at each epoch - Default=1.
Definition: TMultiLayerPerceptron.h:166

TMultiLayerPerceptron::fDelta
Double_t fDelta
Delta - used in stochastic minimisation - Default=0.
Definition: TMultiLayerPerceptron.h:165

TMultiLayerPerceptron::SetDelta
void SetDelta(Double_t delta)
Sets Delta - used in stochastic minimisation (look at the constructor for the complete description of...
Definition: TMultiLayerPerceptron.cxx:670

TMultiLayerPerceptron::fWeight
TString fWeight
Definition: TMultiLayerPerceptron.h:153

TMultiLayerPerceptron::fTau
Double_t fTau
Tau - used in line search - Default=3.
Definition: TMultiLayerPerceptron.h:167

TMultiLayerPerceptron::MLP_Line
void MLP_Line(Double_t *, Double_t *, Double_t)
Sets the weights to a point along a line Weights are set to [origin + (dist * dir)].
Definition: TMultiLayerPerceptron.cxx:2178

TMultiLayerPerceptron::kBFGS
Definition: TMultiLayerPerceptron.h:53

TMultiLayerPerceptron::fTest
TEventList * fTest
EventList defining the events in the test dataset.
Definition: TMultiLayerPerceptron.h:159

TMultiLayerPerceptron::MLP_Batch
void MLP_Batch(Double_t *)
One step for the batch (stochastic) method.
Definition: TMultiLayerPerceptron.cxx:2150

TMultiLayerPerceptron::fLearningMethod
ELearningMethod fLearningMethod
The Learning Method.
Definition: TMultiLayerPerceptron.h:160

TMatrixD.h

TMultiLayerPerceptron::fLastLayer
TObjArray fLastLayer
Definition: TMultiLayerPerceptron.h:150

TMultiLayerPerceptron::MLP_Stochastic
void MLP_Stochastic(Double_t *)
One step for the stochastic method buffer should contain the previous dw vector and will be updated...
Definition: TMultiLayerPerceptron.cxx:2105

TMultiLayerPerceptron::GetEtaDecay
Double_t GetEtaDecay() const
Definition: TMultiLayerPerceptron.h:101

TMultiLayerPerceptron::fTrainingOwner
Bool_t fTrainingOwner
internal flag whether one has to delete fTraining or not
Definition: TMultiLayerPerceptron.h:170

TMultiLayerPerceptron::kTraining
Definition: TMultiLayerPerceptron.h:54

TMultiLayerPerceptron::GetCrossEntropyBinary
Double_t GetCrossEntropyBinary() const
Cross entropy error for sigmoid output neurons, for a given event.
Definition: TMultiLayerPerceptron.cxx:1061

TMultiLayerPerceptron::fStructure
TString fStructure
Definition: TMultiLayerPerceptron.h:152

TMultiLayerPerceptron::ExpandStructure
void ExpandStructure()
Expand the structure of the first layer.
Definition: TMultiLayerPerceptron.cxx:1274

TMultiLayerPerceptron::TMultiLayerPerceptron
TMultiLayerPerceptron()
Default constructor.
Definition: TMultiLayerPerceptron.cxx:252

TMultiLayerPerceptron::BuildFirstLayer
void BuildFirstLayer(TString &)
Instantiates the neurons in input. Inputs are normalised and the type is set to kOff (simple forward o...
Definition: TMultiLayerPerceptron.cxx:1351

TMultiLayerPerceptron::SetEventWeight
void SetEventWeight(const char *)
Set the event weight.
Definition: TMultiLayerPerceptron.cxx:562

TMultiLayerPerceptron::GetEntry
void GetEntry(Int_t) const
Load an entry into the network.
Definition: TMultiLayerPerceptron.cxx:709

TMultiLayerPerceptron::fLastAlpha
Double_t fLastAlpha
internal parameter used in line search
Definition: TMultiLayerPerceptron.h:168

TMultiLayerPerceptron::Result
Double_t Result(Int_t event, Int_t index=0) const
Computes the output for a given event.
Definition: TMultiLayerPerceptron.cxx:983

TMultiLayerPerceptron::GetCrossEntropy
Double_t GetCrossEntropy() const
Cross entropy error for a softmax output neuron, for a given event.
Definition: TMultiLayerPerceptron.cxx:1092

TMultiLayerPerceptron::BuildLastLayer
void BuildLastLayer(TString &, Int_t)
Builds the output layer. Neurons are linear combinations of input, by default.
Definition: TMultiLayerPerceptron.cxx:1433

TMultiLayerPerceptron::SetLearningMethod
void SetLearningMethod(TMultiLayerPerceptron::ELearningMethod method)
Sets the learning method.
Definition: TMultiLayerPerceptron.cxx:640

TMultiLayerPerceptron::SetTau
void SetTau(Double_t tau)
Sets Tau - used in line search (look at the constructor for the complete description of learning meth...
Definition: TMultiLayerPerceptron.cxx:690

TMultiLayerPerceptron::BuildNetwork
void BuildNetwork()
Instantiates the network from the description.
Definition: TMultiLayerPerceptron.cxx:1320

TMultiLayerPerceptron::kFletcherReeves
Definition: TMultiLayerPerceptron.h:53

TMultiLayerPerceptron::EDataSet
EDataSet
Definition: TMultiLayerPerceptron.h:54

TMultiLayerPerceptron::GetType
TNeuron::ENeuronType GetType() const
Definition: TMultiLayerPerceptron.h:106

TMultiLayerPerceptron::GetDelta
Double_t GetDelta() const
Definition: TMultiLayerPerceptron.h:100

TMultiLayerPerceptron::fextD
TString fextD
Definition: TMultiLayerPerceptron.h:157

TMultiLayerPerceptron::GetStructure
TString GetStructure() const
Definition: TMultiLayerPerceptron.h:105

TMultiLayerPerceptron::fEventWeight
TTreeFormula * fEventWeight
formula representing the event weight
Definition: TMultiLayerPerceptron.h:161