doc/v616/MethodMLP_8h_source.html

// @(#)root/tmva $Id$

// Author: Krzysztof Danielowski, Andreas Hoecker, Matt Jachowski, Kamil Kraszewski, Maciej Kruk, Peter Speckmayer, Joerg Stelzer, Eckhard von Toerne, Jan Therhaag, Jiahang Zhong


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : MethodMLP                                                             *

 * Web    : http://tmva.sourceforge.net                                           *

 *                                                                                *

 * Description:                                                                   *

 *      ANN Multilayer Perceptron  class for the discrimination of signal         *

 *      from background.  BFGS implementation based on TMultiLayerPerceptron      *

 *      class from ROOT (http://root.cern.ch).                                    *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Krzysztof Danielowski <danielow@cern.ch>       - IFJ & AGH, Poland        *

 *      Andreas Hoecker       <Andreas.Hocker@cern.ch> - CERN, Switzerland        *

 *      Matt Jachowski        <jachowski@stanford.edu> - Stanford University, USA *

 *      Kamil Kraszewski      <kalq@cern.ch>           - IFJ & UJ, Poland         *

 *      Maciej Kruk           <mkruk@cern.ch>          - IFJ & AGH, Poland        *

 *      Peter Speckmayer      <peter.speckmayer@cern.ch> - CERN, Switzerland      *

 *      Joerg Stelzer         <stelzer@cern.ch>        - DESY, Germany            *

 *      Jan Therhaag          <Jan.Therhaag@cern.ch>   - U of Bonn, Germany       *

 *      Eckhard v. Toerne     <evt@uni-bonn.de>        - U of Bonn, Germany       *

 *      Jiahang Zhong         <Jiahang.Zhong@cern.ch>  - Academia Sinica, Taipei  *

 *                                                                                *

 * Copyright (c) 2005-2011:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (http://tmva.sourceforge.net/LICENSE)                                          *

 **********************************************************************************/


#ifndef ROOT_TMVA_MethodMLP

#define ROOT_TMVA_MethodMLP


//////////////////////////////////////////////////////////////////////////

//                                                                      //

// MethodMLP                                                            //

//                                                                      //

// Multilayer Perceptron built off of MethodANNBase                     //

//                                                                      //

//////////////////////////////////////////////////////////////////////////


#include <vector>

#include "TString.h"

#include "TTree.h"

#include "TObjArray.h"

#include "TRandom3.h"

#include "TH1F.h"

#include "TMatrixDfwd.h"


#include "TMVA/IFitterTarget.h"

#include "TMVA/MethodBase.h"

#include "TMVA/MethodANNBase.h"

#include "TMVA/TNeuron.h"

#include "TMVA/TActivation.h"

#include "TMVA/ConvergenceTest.h"


// Compile-time switch for the Minuit-related declarations of MethodMLP.
// The macro is defined and then immediately undefined, so it ends up
// undefined and every "#ifdef MethodMLP_UseMinuit__" section in this header
// is compiled out. Dropping the #undef line would compile those sections in.
#define MethodMLP_UseMinuit__

#undef  MethodMLP_UseMinuit__


namespace TMVA {


   // Multilayer perceptron built off of MethodANNBase.
   //
   // In addition to the ANN base class it derives from IFitterTarget and
   // ConvergenceTest. Three training methods are enumerated (ETrainingMethod):
   // back propagation (kBP), BFGS (kBFGS) and genetic algorithm (kGA); each has
   // its own group of private helper functions and configuration members below.
   class MethodMLP : public MethodANNBase, public IFitterTarget, public ConvergenceTest {


   public:


      // standard constructors

      // constructor taking job name, method title, data set info and option string
      MethodMLP( const TString& jobName,

                 const TString&  methodTitle,

                 DataSetInfo& theData,

                 const TString& theOption );


      // constructor taking the data set info and a weight file
      MethodMLP( DataSetInfo& theData,

                 const TString& theWeightFile );


      virtual ~MethodMLP();


      // MLP can handle classification with 2 classes and regression with one regression-target
      virtual Bool_t HasAnalysisType( Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets );


      // public training entry point (a private overload taking the number of epochs exists below)
      void Train();

      // for GA

      // called by GeneticANN for GA optimization
      Double_t ComputeEstimator ( std::vector<Double_t>& parameters );

      // interface to the estimate
      Double_t EstimatorFunction( std::vector<Double_t>& parameters );


      // available training methods: back propagation, BFGS, genetic algorithm
      enum ETrainingMethod { kBP=0, kBFGS, kGA };

      // back propagation learning modes
      enum EBPTrainingMode { kSequential=0, kBatch };


      // returns the fCalculateErrors flag (inverse hessian computed at the end of the training)
      bool     HasInverseHessian() { return fCalculateErrors; }

      // get the mva value generated by the NN; both pointer arguments are optional (default 0)
      // NOTE(review): presumably err/errUpper receive the lower/upper error when non-null -- confirm in MethodMLP.cxx
      Double_t GetMvaValue( Double_t* err=0, Double_t* errUpper=0 );


   protected:


      // make ROOT-independent C++ class for classifier response (classifier-specific implementation)

      void MakeClassSpecific( std::ostream&, const TString& ) const;


      // get help message text

      void GetHelpMessage() const;


   private:


      // the option handling methods

      // define the options (their key words) that can be set in the option string
      void DeclareOptions();

      // process user options
      void ProcessOptions();


      // general helper functions

      void     Train( Int_t nEpochs );

      void     Init();                    // default initializations

      void     InitializeLearningRates(); // initialize learning rates of synapses, used only by back propagation


      // used as a measure of success in all minimization techniques

      // calculate the estimator that training is attempting to minimize
      Double_t CalculateEstimator( Types::ETreeType treeType = Types::kTraining, Int_t iEpoch = -1 );


      // BFGS functions

      void     BFGSMinimize( Int_t nEpochs ); // train network with BFGS algorithm

      void     SetGammaDelta( TMatrixD &Gamma, TMatrixD &Delta, std::vector<Double_t> &Buffer );

      void     SteepestDir( TMatrixD &Dir );

      Bool_t   GetHessian( TMatrixD &Hessian, TMatrixD &Gamma, TMatrixD &Delta );

      void     SetDir( TMatrixD &Hessian, TMatrixD &Dir );

      Double_t DerivDir( TMatrixD &Dir );

      Bool_t   LineSearch( TMatrixD &Dir, std::vector<Double_t> &Buffer, Double_t* dError=0 ); //zjh

      void     ComputeDEDw();

      void     SimulateEvent( const Event* ev );

      void     SetDirWeights( std::vector<Double_t> &Origin, TMatrixD &Dir, Double_t alpha );

      Double_t GetError();

      Double_t GetMSEErr( const Event* ev, UInt_t index = 0 );   //zjh

      Double_t GetCEErr( const Event* ev, UInt_t index = 0 );   //zjh


      // backpropagation functions

      // minimize estimator / train network with back propagation algorithm
      void     BackPropagationMinimize( Int_t nEpochs );

      // train network over a single epoch/cycle of events
      void     TrainOneEpoch();

      void     Shuffle( Int_t* index, Int_t n );

      // decay synapse weights; in late epochs the learning rate is lowered even more to find a good minimum
      void     DecaySynapseWeights(Bool_t lateEpoch );

      // train network over a single event
      void     TrainOneEvent( Int_t ievt);

      // get the desired output of this event
      Double_t GetDesiredOutput( const Event* ev );

      // update the network based on how closely the output matched the desired output
      void     UpdateNetwork( Double_t desired, Double_t eventWeight=1.0 );

      // overload taking a vector of desired values
      void     UpdateNetwork(const std::vector<Float_t>& desired, Double_t eventWeight=1.0);

      // have each neuron calculate its delta by back propagation
      void     CalculateNeuronDeltas();

      // update synapse error fields and adjust the weights (if in sequential mode)
      void     UpdateSynapses();

      // just adjust the synapse weights (should be called in batch mode)
      void     AdjustSynapseWeights();


      // faster backpropagation

      // fast per-event training
      void     TrainOneEventFast( Int_t ievt, Float_t*& branchVar, Int_t& type );


      // genetic algorithm functions

      // create genetics class and give it the vector of parameter ranges (parameters = weights)
      void GeneticMinimize();


      // the following declarations are compiled only if MethodMLP_UseMinuit__ is defined
#ifdef MethodMLP_UseMinuit__

      // minuit functions -- commented out because they rely on a static pointer

      void MinuitMinimize();

      static MethodMLP* GetThisPtr();

      static void IFCN( Int_t& npars, Double_t* grad, Double_t &f, Double_t* fitPars, Int_t ifl );

      void FCN( Int_t& npars, Double_t* grad, Double_t &f, Double_t* fitPars, Int_t ifl );

#endif


      // general

      bool               fUseRegulator;         // zjh

      bool               fCalculateErrors;      // compute inverse hessian matrix at the end of the training

      Double_t           fPrior;                // zjh

      std::vector<Double_t> fPriorDev;          // zjh

      void               GetApproxInvHessian ( TMatrixD& InvHessian, bool regulate=true );   //rank-1 approximation, neglect 2nd derivatives. //zjh

      void               UpdateRegulators();    // zjh

      void               UpdatePriors();        // zjh

      Int_t              fUpdateLimit;          // zjh


      ETrainingMethod fTrainingMethod; // method of training: BP, BFGS or GA (see ETrainingMethod)

      TString         fTrainMethodS;   // training method option param


      Float_t         fSamplingFraction;  // fraction of events which is sampled for training

      Float_t         fSamplingEpoch;     // fraction of epochs where sampling is used

      Float_t         fSamplingWeight;    // changing factor for event weights when sampling is turned on

      Bool_t          fSamplingTraining;  // The training sample is sampled

      Bool_t          fSamplingTesting;   // The testing sample is sampled


      // BFGS variables

      Double_t        fLastAlpha;      // line search variable

      Double_t        fTau;            // line search variable

      Int_t           fResetStep;      // reset time (how often we clear hessian matrix)


      // back propagation variable

      Double_t        fLearnRate;      // learning rate for synapse weight adjustments

      Double_t        fDecayRate;      // decay rate for above learning rate

      EBPTrainingMode fBPMode;         // backprop learning mode (sequential or batch)

      TString         fBpModeS;        // backprop learning mode option string (sequential or batch)

      Int_t           fBatchSize;      // batch size, only matters if in batch learning mode

      Int_t           fTestRate;       // test for overtraining performed at each #th epochs

      Bool_t          fEpochMon;       // create and fill epoch-wise monitoring histograms (makes outputfile big!)


      // genetic algorithm variables

      Int_t           fGA_nsteps;      // GA settings: number of steps

      Int_t           fGA_preCalc;     // GA settings: number of pre-calc steps

      Int_t           fGA_SC_steps;    // GA settings: SC_steps

      Int_t           fGA_SC_rate; // GA settings: SC_rate

      Double_t        fGA_SC_factor;   // GA settings: SC_factor


      // regression, storage of deviations

      // NOTE(review): raw pointer; ownership/lifetime is not visible in this header -- confirm in MethodMLP.cxx
      std::vector<std::pair<Float_t,Float_t> >* fDeviationsFromTargets; // deviation from the targets, event weight


      Float_t         fWeightRange;    // suppress outliers for the estimator calculation


      // the following members are compiled only if MethodMLP_UseMinuit__ is defined
#ifdef MethodMLP_UseMinuit__

      // minuit variables -- commented out because they rely on a static pointer

      Int_t          fNumberOfWeights; // Minuit: number of weights

      static MethodMLP* fgThis;        // Minuit: this pointer

#endif


      // debugging flags

      static const Int_t  fgPRINT_ESTIMATOR_INC = 10;     // debug flags

      static const Bool_t fgPRINT_SEQ           = kFALSE; // debug flags

      static const Bool_t fgPRINT_BATCH         = kFALSE; // debug flags


      // ROOT dictionary declaration; the class version id is 0
      ClassDef(MethodMLP,0); // Multi-layer perceptron implemented specifically for TMVA

   };


} // namespace TMVA


#endif

ConvergenceTest.h

IFitterTarget.h

MethodANNBase.h

MethodBase.h

f
#define f(i)
Definition: RSha256.hxx:104

Int_t
int Int_t
Definition: RtypesCore.h:41

UInt_t
unsigned int UInt_t
Definition: RtypesCore.h:42

kFALSE
const Bool_t kFALSE
Definition: RtypesCore.h:88

Bool_t
bool Bool_t
Definition: RtypesCore.h:59

Double_t
double Double_t
Definition: RtypesCore.h:55

Float_t
float Float_t
Definition: RtypesCore.h:53

ClassDef
#define ClassDef(name, id)
Definition: Rtypes.h:324

TActivation.h

type
int type
Definition: TGX11.cxx:120

TH1F.h

TMatrixDfwd.h

TObjArray.h

TRandom3.h

TString.h

TTree.h

TMVA::ConvergenceTest
Check for convergence.
Definition: ConvergenceTest.h:46

TMVA::DataSetInfo
Class that contains all the data information.
Definition: DataSetInfo.h:60

TMVA::Event
Definition: Event.h:52

TMVA::IFitterTarget
Interface for a fitter 'target'.
Definition: IFitterTarget.h:44

TMVA::MethodANNBase
Base class for all TMVA methods using artificial neural networks.
Definition: MethodANNBase.h:62

TMVA::MethodMLP
Multilayer Perceptron class built off of MethodANNBase.
Definition: MethodMLP.h:69

TMVA::MethodMLP::fResetStep
Int_t fResetStep
Definition: MethodMLP.h:185

TMVA::MethodMLP::fCalculateErrors
bool fCalculateErrors
Definition: MethodMLP.h:165

TMVA::MethodMLP::fDeviationsFromTargets
std::vector< std::pair< Float_t, Float_t > > * fDeviationsFromTargets
Definition: MethodMLP.h:204

TMVA::MethodMLP::LineSearch
Bool_t LineSearch(TMatrixD &Dir, std::vector< Double_t > &Buffer, Double_t *dError=0)
Definition: MethodMLP.cxx:844

TMVA::MethodMLP::fTau
Double_t fTau
Definition: MethodMLP.h:184

TMVA::MethodMLP::fGA_SC_rate
Int_t fGA_SC_rate
Definition: MethodMLP.h:200

TMVA::MethodMLP::fWeightRange
Float_t fWeightRange
Definition: MethodMLP.h:206

TMVA::MethodMLP::fSamplingWeight
Float_t fSamplingWeight
Definition: MethodMLP.h:178

TMVA::MethodMLP::fBatchSize
Int_t fBatchSize
Definition: MethodMLP.h:192

TMVA::MethodMLP::GetHelpMessage
void GetHelpMessage() const
get help message text
Definition: MethodMLP.cxx:1719

TMVA::MethodMLP::BackPropagationMinimize
void BackPropagationMinimize(Int_t nEpochs)
minimize estimator / train network with back propagation algorithm
Definition: MethodMLP.cxx:1041

TMVA::MethodMLP::GetMSEErr
Double_t GetMSEErr(const Event *ev, UInt_t index=0)
Definition: MethodMLP.cxx:1007

TMVA::MethodMLP::fUseRegulator
bool fUseRegulator
Definition: MethodMLP.h:164

TMVA::MethodMLP::GetMvaValue
Double_t GetMvaValue(Double_t *err=0, Double_t *errUpper=0)
get the mva value generated by the NN
Definition: MethodMLP.cxx:1553

TMVA::MethodMLP::MakeClassSpecific
void MakeClassSpecific(std::ostream &, const TString &) const
write specific classifier response
Definition: MethodMLP.cxx:1708

TMVA::MethodMLP::AdjustSynapseWeights
void AdjustSynapseWeights()
just adjust the synapse weights (should be called in batch mode)
Definition: MethodMLP.cxx:1438

TMVA::MethodMLP::fPriorDev
std::vector< Double_t > fPriorDev
Definition: MethodMLP.h:167

TMVA::MethodMLP::HasInverseHessian
bool HasInverseHessian()
Definition: MethodMLP.h:94

TMVA::MethodMLP::fBpModeS
TString fBpModeS
Definition: MethodMLP.h:191

TMVA::MethodMLP::SteepestDir
void SteepestDir(TMatrixD &Dir)
Definition: MethodMLP.cxx:778

TMVA::MethodMLP::TrainOneEpoch
void TrainOneEpoch()
train network over a single epoch/cycle of events
Definition: MethodMLP.cxx:1146

TMVA::MethodMLP::HasAnalysisType
virtual Bool_t HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets)
MLP can handle classification with 2 classes and regression with one regression-target.
Definition: MethodMLP.cxx:154

TMVA::MethodMLP::fTrainMethodS
TString fTrainMethodS
Definition: MethodMLP.h:174

TMVA::MethodMLP::fGA_nsteps
Int_t fGA_nsteps
Definition: MethodMLP.h:197

TMVA::MethodMLP::fPrior
Double_t fPrior
Definition: MethodMLP.h:166

TMVA::MethodMLP::GetHessian
Bool_t GetHessian(TMatrixD &Hessian, TMatrixD &Gamma, TMatrixD &Delta)
Definition: MethodMLP.cxx:791

TMVA::MethodMLP::ComputeEstimator
Double_t ComputeEstimator(std::vector< Double_t > &parameters)
this function is called by GeneticANN for GA optimization
Definition: MethodMLP.cxx:1397

TMVA::MethodMLP::fUpdateLimit
Int_t fUpdateLimit
Definition: MethodMLP.h:171

TMVA::MethodMLP::fgPRINT_BATCH
static const Bool_t fgPRINT_BATCH
Definition: MethodMLP.h:217

TMVA::MethodMLP::InitializeLearningRates
void InitializeLearningRates()
initialize learning rates of synapses, used only by back propagation
Definition: MethodMLP.cxx:280

TMVA::MethodMLP::fGA_preCalc
Int_t fGA_preCalc
Definition: MethodMLP.h:198

TMVA::MethodMLP::CalculateNeuronDeltas
void CalculateNeuronDeltas()
have each neuron calculate its delta by back propagation
Definition: MethodMLP.cxx:1332

TMVA::MethodMLP::fTestRate
Int_t fTestRate
Definition: MethodMLP.h:193

TMVA::MethodMLP::fDecayRate
Double_t fDecayRate
Definition: MethodMLP.h:189

TMVA::MethodMLP::fTrainingMethod
ETrainingMethod fTrainingMethod
Definition: MethodMLP.h:173

TMVA::MethodMLP::fBPMode
EBPTrainingMode fBPMode
Definition: MethodMLP.h:190

TMVA::MethodMLP::DerivDir
Double_t DerivDir(TMatrixD &Dir)
Definition: MethodMLP.cxx:829

TMVA::MethodMLP::fGA_SC_factor
Double_t fGA_SC_factor
Definition: MethodMLP.h:201

TMVA::MethodMLP::GetCEErr
Double_t GetCEErr(const Event *ev, UInt_t index=0)
Definition: MethodMLP.cxx:1024

TMVA::MethodMLP::~MethodMLP
virtual ~MethodMLP()
destructor; nothing to be done
Definition: MethodMLP.cxx:140

TMVA::MethodMLP::fGA_SC_steps
Int_t fGA_SC_steps
Definition: MethodMLP.h:199

TMVA::MethodMLP::SetDir
void SetDir(TMatrixD &Hessian, TMatrixD &Dir)
Definition: MethodMLP.cxx:812

TMVA::MethodMLP::Shuffle
void Shuffle(Int_t *index, Int_t n)
Input:
Definition: MethodMLP.cxx:1194

TMVA::MethodMLP::fSamplingTraining
Bool_t fSamplingTraining
Definition: MethodMLP.h:179

TMVA::MethodMLP::SimulateEvent
void SimulateEvent(const Event *ev)
Definition: MethodMLP.cxx:738

TMVA::MethodMLP::ETrainingMethod
ETrainingMethod
Definition: MethodMLP.h:91

TMVA::MethodMLP::kGA
@ kGA
Definition: MethodMLP.h:91

TMVA::MethodMLP::kBP
@ kBP
Definition: MethodMLP.h:91

TMVA::MethodMLP::kBFGS
@ kBFGS
Definition: MethodMLP.h:91

TMVA::MethodMLP::SetDirWeights
void SetDirWeights(std::vector< Double_t > &Origin, TMatrixD &Dir, Double_t alpha)
Definition: MethodMLP.cxx:954

TMVA::MethodMLP::SetGammaDelta
void SetGammaDelta(TMatrixD &Gamma, TMatrixD &Delta, std::vector< Double_t > &Buffer)
Definition: MethodMLP.cxx:676

TMVA::MethodMLP::Train
void Train()
Definition: MethodMLP.cxx:144

TMVA::MethodMLP::EstimatorFunction
Double_t EstimatorFunction(std::vector< Double_t > &parameters)
interface to the estimate
Definition: MethodMLP.cxx:1389

TMVA::MethodMLP::fLearnRate
Double_t fLearnRate
Definition: MethodMLP.h:188

TMVA::MethodMLP::UpdatePriors
void UpdatePriors()
Definition: MethodMLP.cxx:1458

TMVA::MethodMLP::GetApproxInvHessian
void GetApproxInvHessian(TMatrixD &InvHessian, bool regulate=true)
Definition: MethodMLP.cxx:1512

TMVA::MethodMLP::BFGSMinimize
void BFGSMinimize(Int_t nEpochs)
train network with BFGS algorithm
Definition: MethodMLP.cxx:491

TMVA::MethodMLP::UpdateSynapses
void UpdateSynapses()
update synapse error fields and adjust the weights (if in sequential mode)
Definition: MethodMLP.cxx:1416

TMVA::MethodMLP::Init
void Init()
default initializations
Definition: MethodMLP.cxx:166

TMVA::MethodMLP::fgPRINT_ESTIMATOR_INC
static const Int_t fgPRINT_ESTIMATOR_INC
Definition: MethodMLP.h:215

TMVA::MethodMLP::EBPTrainingMode
EBPTrainingMode
Definition: MethodMLP.h:92

TMVA::MethodMLP::kSequential
@ kSequential
Definition: MethodMLP.h:92

TMVA::MethodMLP::kBatch
@ kBatch
Definition: MethodMLP.h:92

TMVA::MethodMLP::ProcessOptions
void ProcessOptions()
process user options
Definition: MethodMLP.cxx:249

TMVA::MethodMLP::fSamplingFraction
Float_t fSamplingFraction
Definition: MethodMLP.h:176

TMVA::MethodMLP::TrainOneEvent
void TrainOneEvent(Int_t ievt)
train network over a single event; this uses the new event model
Definition: MethodMLP.cxx:1262

TMVA::MethodMLP::GetDesiredOutput
Double_t GetDesiredOutput(const Event *ev)
get the desired output of this event
Definition: MethodMLP.cxx:1281

TMVA::MethodMLP::GeneticMinimize
void GeneticMinimize()
create genetics class similar to GeneticCut; give it vector of parameter ranges (parameters = weights)...
Definition: MethodMLP.cxx:1360

TMVA::MethodMLP::fSamplingTesting
Bool_t fSamplingTesting
Definition: MethodMLP.h:180

TMVA::MethodMLP::GetError
Double_t GetError()
Definition: MethodMLP.cxx:970

TMVA::MethodMLP::fLastAlpha
Double_t fLastAlpha
Definition: MethodMLP.h:183

TMVA::MethodMLP::fSamplingEpoch
Float_t fSamplingEpoch
Definition: MethodMLP.h:177

TMVA::MethodMLP::DecaySynapseWeights
void DecaySynapseWeights(Bool_t lateEpoch)
decay synapse weights in last 10 epochs, lower learning rate even more to find a good minimum
Definition: MethodMLP.cxx:1212

TMVA::MethodMLP::TrainOneEventFast
void TrainOneEventFast(Int_t ievt, Float_t *&branchVar, Int_t &type)
fast per-event training
Definition: MethodMLP.cxx:1226

TMVA::MethodMLP::fEpochMon
Bool_t fEpochMon
Definition: MethodMLP.h:194

TMVA::MethodMLP::ComputeDEDw
void ComputeDEDw()
Definition: MethodMLP.cxx:701

TMVA::MethodMLP::UpdateNetwork
void UpdateNetwork(Double_t desired, Double_t eventWeight=1.0)
update the network based on how closely the output matched the desired output
Definition: MethodMLP.cxx:1290

TMVA::MethodMLP::MethodMLP
MethodMLP(const TString &jobName, const TString &methodTitle, DataSetInfo &theData, const TString &theOption)
standard constructor
Definition: MethodMLP.cxx:92

TMVA::MethodMLP::UpdateRegulators
void UpdateRegulators()
Definition: MethodMLP.cxx:1472

TMVA::MethodMLP::DeclareOptions
void DeclareOptions()
define the options (their key words) that can be set in the option string
Definition: MethodMLP.cxx:197

TMVA::MethodMLP::CalculateEstimator
Double_t CalculateEstimator(Types::ETreeType treeType=Types::kTraining, Int_t iEpoch=-1)
calculate the estimator that training is attempting to minimize
Definition: MethodMLP.cxx:294

TMVA::MethodMLP::fgPRINT_SEQ
static const Bool_t fgPRINT_SEQ
Definition: MethodMLP.h:216

TMVA::Types::EAnalysisType
EAnalysisType
Definition: Types.h:127

TMVA::Types::ETreeType
ETreeType
Definition: Types.h:143

TMVA::Types::kTraining
@ kTraining
Definition: Types.h:144

TMatrixT< Double_t >

TString
Basic string class.
Definition: TString.h:131

n
const Int_t n
Definition: legend1.C:16

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMath::Gamma
Double_t Gamma(Double_t z)
Computation of gamma(z) for all z.
Definition: TMath.cxx:348

TNeuron.h