#ifdef MethodMLP_UseMinuit__
// ...
TMVA::MethodMLP::MethodMLP( const TString& jobName,
                            const TString& methodTitle,
                            DataSetInfo& theData,
                            const TString& theOption,
                            TDirectory* theTargetDir )
   : MethodANNBase( jobName, Types::kMLP, methodTitle, theData, theOption, theTargetDir ),
     fUseRegulator(false), fCalculateErrors(false),
     fPrior(0.0), fPriorDev(0), fUpdateLimit(0),
     fTrainingMethod(kBFGS), fTrainMethodS("BFGS"),
     fSamplingFraction(1.0), fSamplingEpoch(0.0), fSamplingWeight(0.0),
     fSamplingTraining(false), fSamplingTesting(false),
     fLastAlpha(0.0), fTau(0.),
     fResetStep(0), fLearnRate(0.0), fDecayRate(0.0),
     fBPMode(kSequential), fBpModeS("None"),
     fBatchSize(0), fTestRate(0), fEpochMon(false),
     fGA_nsteps(0), fGA_preCalc(0), fGA_SC_steps(0),
     fGA_SC_rate(0), fGA_SC_factor(0.0),
     fDeviationsFromTargets(0),
     // ...

// the second constructor initializes the same members
// ...
     fUseRegulator(false), fCalculateErrors(false),
     fPrior(0.0), fPriorDev(0), fUpdateLimit(0),
     fTrainingMethod(kBFGS), fTrainMethodS("BFGS"),
     fSamplingFraction(1.0), fSamplingEpoch(0.0), fSamplingWeight(0.0),
     fSamplingTraining(false), fSamplingTesting(false),
     fLastAlpha(0.0), fTau(0.),
     fResetStep(0), fLearnRate(0.0), fDecayRate(0.0),
     fBPMode(kSequential), fBpModeS("None"),
     fBatchSize(0), fTestRate(0), fEpochMon(false),
     fGA_nsteps(0), fGA_preCalc(0), fGA_SC_steps(0),
     fGA_SC_rate(0), fGA_SC_factor(0.0),
     fDeviationsFromTargets(0),
     // ...

// Init(): default initializations
   SetSignalReferenceCut( 0.5 );

#ifdef MethodMLP_UseMinuit__
   // ...

// DeclareOptions: define the configuration options of the MLP
   DeclareOptionRef(fTrainMethodS="BP", "TrainingMethod",
                    "Train with Back-Propagation (BP), BFGS Algorithm (BFGS), or Genetic Algorithm (GA - slower and worse)");

   DeclareOptionRef(fLearnRate=0.02,    "LearningRate", "ANN learning rate parameter");
   DeclareOptionRef(fDecayRate=0.01,    "DecayRate",    "Decay rate for learning parameter");
   DeclareOptionRef(fTestRate =10,      "TestRate",     "Test for overtraining performed at each #th epochs");
   DeclareOptionRef(fEpochMon = kFALSE, "EpochMonitoring",
                    "Provide epoch-wise monitoring plots according to TestRate (caution: causes big ROOT output file!)" );

   DeclareOptionRef(fSamplingFraction=1.0, "Sampling",
                    "Only 'Sampling' (randomly selected) events are trained each epoch");
   DeclareOptionRef(fSamplingEpoch=1.0, "SamplingEpoch",
                    "Sampling is used for the first 'SamplingEpoch' epochs; afterwards, all events are taken for training");
   DeclareOptionRef(fSamplingWeight=1.0, "SamplingImportance",
                    "The sampling weights of events in epochs which were successful (worse estimator than before) are multiplied with SamplingImportance, else they are divided.");

   DeclareOptionRef(fSamplingTraining=kTRUE,  "SamplingTraining", "The training sample is sampled");
   DeclareOptionRef(fSamplingTesting =kFALSE, "SamplingTesting",  "The testing sample is sampled");

   DeclareOptionRef(fResetStep=50,  "ResetStep", "How often BFGS should reset history");
   DeclareOptionRef(fTau      =3.0, "Tau",       "LineSearch \"size step\"");

   DeclareOptionRef(fBpModeS="sequential", "BPMode",
                    "Back-propagation learning mode: sequential or batch");
   AddPreDefVal(TString("sequential"));
   AddPreDefVal(TString("batch"));

   DeclareOptionRef(fBatchSize=-1, "BatchSize",
                    "Batch size: number of events/batch, only set if in Batch Mode, -1 for BatchSize=number_of_events");

   DeclareOptionRef(fImprovement=1e-30, "ConvergenceImprove",
                    "Minimum improvement which counts as improvement (<0 means automatic convergence check is turned off)");

   DeclareOptionRef(fSteps=-1, "ConvergenceTests",
                    "Number of steps (without improvement) required for convergence (<0 means automatic convergence check is turned off)");

   DeclareOptionRef(fUseRegulator=kFALSE, "UseRegulator",
                    "Use regulator to avoid over-training");
   DeclareOptionRef(fUpdateLimit=10000, "UpdateLimit",
                    "Maximum times of regulator update");
   DeclareOptionRef(fCalculateErrors=kFALSE, "CalculateErrors",
                    "Calculates inverse Hessian matrix at the end of the training to be able to calculate the uncertainties of an MVA value");

   DeclareOptionRef(fWeightRange=1.0, "WeightRange",
                    "Take the events for the estimator calculations from small deviations from the desired value to large deviations only over the weight range");

// ProcessOptions: map the option strings onto the internal enums
   if (IgnoreEventsWithNegWeightsInTraining()) {
      Log() << kINFO
            << "Will ignore negative events in training!"
            << Endl;
   }

   if      (fTrainMethodS == "BP"  ) fTrainingMethod = kBP;
   else if (fTrainMethodS == "BFGS") fTrainingMethod = kBFGS;
   else if (fTrainMethodS == "GA"  ) fTrainingMethod = kGA;

   if      (fBpModeS == "sequential") fBPMode = kSequential;
   else if (fBpModeS == "batch")      fBPMode = kBatch;
   // ...
   if (fBPMode == kBatch) {
      // ...
      if (fBatchSize < 1 || fBatchSize > numEvents) fBatchSize = numEvents;
   }

// InitializeLearningRates: set the initial learning rate of every synapse
   Int_t numSynapses = fSynapses->GetEntriesFast();
   for (Int_t i = 0; i < numSynapses; i++) {
      synapse = (TSynapse*)fSynapses->At(i);
      // ...
   }

// CalculateEstimator: compute the estimator that the training tries to minimize
      Log() << kFATAL << "<CalculateEstimator> fatal error: wrong tree type: " << treeType << Endl;
   // ...
   Data()->SetCurrentType(treeType);
   // ...
   if (fEpochMon && iEpoch >= 0 && !DoRegression()) {
      histS = new TH1F( nameS, nameS, nbin, -limit, limit );
      histB = new TH1F( nameB, nameB, nbin, -limit, limit );
   }
   // ...
   UInt_t nClasses = DataInfo().GetNClasses();
   UInt_t nTgts    = DataInfo().GetNTargets();
   // ...
   if (fWeightRange < 1.f) {
      fDeviationsFromTargets = new std::vector<std::pair<Float_t,Float_t> >(nEvents);
   }

   // ... event loop ...
      const Event* ev = GetEvent(i);

      if ((ev->GetWeight() < 0) && IgnoreEventsWithNegWeightsInTraining()
          // ...

      ForceNetworkInputs( ev );
      ForceNetworkCalculations();
      // ...
      if (DoRegression()) {
         for (UInt_t itgt = 0; itgt < nTgts; itgt++) {
            v = GetOutputNeuron( itgt )->GetActivationValue();
            // ...
         }
      }
      else if (DoMulticlass()) {
         // ...
         if (fEstimator==kCE) {
            // ...
            for (UInt_t icls = 0; icls < nClasses; icls++) {
               Float_t activationValue = GetOutputNeuron( icls )->GetActivationValue();
               norm += exp( activationValue );
               // ...
               d = exp( activationValue );
            }
            // ...
         }
         else {
            for (UInt_t icls = 0; icls < nClasses; icls++) {
               Double_t desired = (icls==cls) ? 1.0 : 0.0;
               v = GetOutputNeuron( icls )->GetActivationValue();
               d = (desired-v)*(desired-v);
            }
         }
      }
      else {
         Double_t desired = DataInfo().IsSignal(ev) ? 1. : 0.;
         v = GetOutputNeuron()->GetActivationValue();
         if (fEstimator==kMSE) d = (desired-v)*(desired-v);
         // ...
      }
      // ...
      if (fDeviationsFromTargets)
         fDeviationsFromTargets->push_back(std::pair<Float_t,Float_t>(d,w));
      // ...
      if      (DataInfo().IsSignal(ev) && histS != 0) histS->Fill( float(v), float(w) );
      else if (histB != 0)                            histB->Fill( float(v), float(w) );
   // ...
   if (fDeviationsFromTargets) {
      std::sort(fDeviationsFromTargets->begin(),fDeviationsFromTargets->end());
      // ...
      Float_t sumOfWeightsInRange = fWeightRange*sumOfWeights;
      // ...
      Float_t weightRangeCut = fWeightRange*sumOfWeights;
      // ...
      for (std::vector<std::pair<Float_t,Float_t> >::iterator itDev = fDeviationsFromTargets->begin(),
              itDevEnd = fDeviationsFromTargets->end(); itDev != itDevEnd; ++itDev) {
         float deviation = (*itDev).first;
         float devWeight = (*itDev).second;
         weightSum += devWeight;
         if (weightSum <= weightRangeCut) {
            estimator += devWeight*deviation;
         }
      }
      // ...
      sumOfWeights = sumOfWeightsInRange;
      delete fDeviationsFromTargets;
   }
   // ...
   if (histS != 0) fEpochMonHistS.push_back( histS );
   if (histB != 0) fEpochMonHistB.push_back( histB );
   // ...
   if      (DoRegression()) estimator = estimator/Float_t(sumOfWeights);
   else if (DoMulticlass()) estimator = estimator/Float_t(sumOfWeights);
   else                     estimator = estimator/Float_t(sumOfWeights);
   // ...
   Data()->SetCurrentType( saveType );
   // ...
   if (fEpochMon && iEpoch >= 0 && !DoRegression() && treeType == Types::kTraining) {
      CreateWeightMonitoringHists( Form("epochmonitoring___epoch_%04i_weights_hist", iEpoch),
                                   &fEpochMonHistW );
   }

// Train: initialize the network, run the chosen minimizer, and prepare the
// regulator terms / inverse Hessian if required
      Log() << kFATAL << "ANN Network is not initialized, doing it now!" << Endl;
      SetAnalysisType(GetAnalysisType());
   // ...
   InitializeLearningRates();
   PrintMessage("Training Network");
   // ...
   Int_t nSynapses=fSynapses->GetEntriesFast();
   if (nSynapses>nEvents)
      Log() << kWARNING << "ANN too complicated: #events=" << nEvents
            << "\t#synapses=" << nSynapses << Endl;

#ifdef MethodMLP_UseMinuit__
   if (useMinuit) MinuitMinimize();
   // ...
   if      (fTrainingMethod == kGA)   GeneticMinimize();
   else if (fTrainingMethod == kBFGS) BFGSMinimize(nEpochs);
   else                               BackPropagationMinimize(nEpochs);
   // ...
      Log() << kINFO << "Finalizing handling of Regulator terms, trainE="
            << trainE << " testE=" << testE << Endl;
      // ...
      Log() << kINFO << "Done with handling of Regulator terms" << Endl;
   // ...
   if (fCalculateErrors || fUseRegulator) {
      // ...
      Int_t numSynapses=fSynapses->GetEntriesFast();
      fInvHessian.ResizeTo(numSynapses,numSynapses);
      GetApproxInvHessian( fInvHessian, false );
   }

// BFGSMinimize: train the network with the BFGS algorithm
   Timer timer( (fSteps>0?100:nEpochs), GetName() );
   // ...
   fEstimatorHistTrain = new TH1F( "estimatorHistTrain", "training estimator",
                                   nbinTest, Int_t(fTestRate/2), nbinTest*fTestRate+Int_t(fTestRate/2) );
   fEstimatorHistTest  = new TH1F( "estimatorHistTest", "test estimator",
                                   nbinTest, Int_t(fTestRate/2), nbinTest*fTestRate+Int_t(fTestRate/2) );
   // ...
   Int_t nSynapses = fSynapses->GetEntriesFast();
   Int_t nWeights  = nSynapses;
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
   }
   // ...
   std::vector<Double_t> buffer( nWeights );
   for (Int_t i=0;i<nWeights;i++) buffer[i] = 0.;
   // ...
   TMatrixD Hessian ( nWeights, nWeights );
   // ...
   Int_t RegUpdateTimes=0;
   // ...
   if (fSamplingTraining || fSamplingTesting)
      Data()->InitSampling(1.0,1.0,fRandomSeed);
   // ...
   if (fSteps > 0) Log() << kINFO << "Inaccurate progress timing for MLP... " << Endl;
   // ...
   for (Int_t i = 0; i < nEpochs; i++) {
      if (Float_t(i)/nEpochs < fSamplingEpoch) {
         if ((i+1)%fTestRate == 0 || (i == 0)) {
            if (fSamplingTraining) {
               // ...
               Data()->InitSampling(fSamplingFraction,fSamplingWeight);
               Data()->CreateSampling();
            }
            if (fSamplingTesting) {
               // ...
               Data()->InitSampling(fSamplingFraction,fSamplingWeight);
               Data()->CreateSampling();
            }
         }
      }
      else {
         // ...
         Data()->InitSampling(1.0,1.0);
         // ...
         Data()->InitSampling(1.0,1.0);
      }
      // ...
      SetGammaDelta( Gamma, Delta, buffer );
      // ...
      if (i % fResetStep == 0 && i<0.5*nEpochs) {
         // ...
      }
      // ...
      if (GetHessian( Hessian, Gamma, Delta )) {
         // ...
      }
      else SetDir( Hessian, Dir );
      // ...
      if (DerivDir( Dir ) > 0) {
         // ...
      }
      if (LineSearch( Dir, buffer, &dError )) {
         // ...
         if (LineSearch(Dir, buffer, &dError)) {
            // ...
            Log() << kFATAL << "Line search failed! Huge troubles somewhere..." << Endl;
         }
      }
      // ...
      if (fUseRegulator && RegUpdateTimes<fUpdateLimit && RegUpdateCD>=5 && fabs(dError)<0.1*AccuError) {
         Log() << kDEBUG << "\n\nUpdate regulators " << RegUpdateTimes << " on epoch " << i
               << "\tdError=" << dError << Endl;
         // ...
      }
      // ...
      if ((i+1)%fTestRate == 0) {
         // ...
         fEstimatorHistTrain->Fill( i+1, trainE );
         fEstimatorHistTest ->Fill( i+1, testE );
         // ...
         if ((testE < GetCurrentValue()) || (GetCurrentValue()<1e-100)) {
            // ...
         }
         Data()->EventResult( success );
         // ...
         SetCurrentValue( testE );
         if (HasConverged()) {
            if (Float_t(i)/nEpochs < fSamplingEpoch) {
               Int_t newEpoch = Int_t(fSamplingEpoch*nEpochs);
               // ...
               ResetConvergenceCounter();
            }
            // ...
         }
      }
      // ...
      TString convText = Form( "<D^2> (train/test/epoch): %.4g/%.4g/%d", trainE, testE, i );
      // ...
      if (Float_t(i)/nEpochs < fSamplingEpoch)
         progress = Progress()*fSamplingFraction*100*fSamplingEpoch;
      // ...
         progress = 100.0*(fSamplingFraction*fSamplingEpoch+(1.0-fSamplingEpoch)*Progress());
      // ...
      Float_t progress2 = 100.0*RegUpdateTimes/fUpdateLimit;
      if (progress2>progress) progress=progress2;
      // ...
      if (progress<i) progress=i;
      // ...
   }

// SetGammaDelta: Gamma = change of the gradient, Delta = change of the weights
// over the last step (Delta is taken from the line-search buffer)
   Int_t nWeights = fSynapses->GetEntriesFast();
   // ...
   Int_t nSynapses = fSynapses->GetEntriesFast();
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      Gamma[IDX++][0] = -synapse->GetDEDw();
   }
   for (Int_t i=0;i<nWeights;i++) Delta[i][0] = buffer[i];
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      Gamma[IDX++][0] += synapse->GetDEDw();
   }

// compute dE/dw for every synapse, averaged over all (positive-weight) events
   Int_t nSynapses = fSynapses->GetEntriesFast();
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
   }

   // ... event loop ...
      const Event* ev = GetEvent(i);
      if ((ev->GetWeight() < 0) && IgnoreEventsWithNegWeightsInTraining()
          // ...
      // ...
      for (Int_t j=0;j<nSynapses;j++) {
         // ...
      }
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      if (fUseRegulator) DEDw+=fPriorDev[i];
      synapse->SetDEDw( DEDw / nPosEvents );
   }

// SimulateEvent: propagate one event through the network and set the
// output-neuron errors used to accumulate dE/dw
   ForceNetworkInputs( ev );
   ForceNetworkCalculations();
   // ...
   if (DoRegression()) {
      UInt_t ntgt = DataInfo().GetNTargets();
      for (UInt_t itgt = 0; itgt < ntgt; itgt++) {
         // ...
         Double_t error = ( GetOutputNeuron( itgt )->GetActivationValue() - desired )*eventWeight;
         GetOutputNeuron( itgt )->SetError(error);
      }
   }
   else if (DoMulticlass()) {
      UInt_t nClasses = DataInfo().GetNClasses();
      // ...
      for (UInt_t icls = 0; icls < nClasses; icls++) {
         Double_t desired = ( cls==icls ? 1.0 : 0.0 );
         Double_t error   = ( GetOutputNeuron( icls )->GetActivationValue() - desired )*eventWeight;
         GetOutputNeuron( icls )->SetError(error);
      }
   }
   else {
      Double_t desired = GetDesiredOutput( ev );
      // ...
      if      (fEstimator==kMSE) error = ( GetOutputNeuron()->GetActivationValue() - desired )*eventWeight;
      else if (fEstimator==kCE)  error = -eventWeight/(GetOutputNeuron()->GetActivationValue() -1 + desired);
      GetOutputNeuron()->SetError(error);
   }
   // ...
   CalculateNeuronDeltas();
   for (Int_t j=0;j<fSynapses->GetEntriesFast();j++) {
      // ...
   }

// SteepestDir: steepest-descent direction, Dir = -dE/dw
   Int_t nSynapses = fSynapses->GetEntriesFast();
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      Dir[IDX++][0] = -synapse->GetDEDw();
   }

// SetDir: quasi-Newton direction, Dir = -H * dE/dw
   Int_t nSynapses = fSynapses->GetEntriesFast();
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      DEDw[IDX++][0] = synapse->GetDEDw();
   }
   // ...
   dir = Hessian * DEDw;
   for (Int_t i=0;i<IDX;i++) dir[i][0] = -dir[i][0];

// DerivDir: directional derivative of the error along Dir
   Int_t nSynapses = fSynapses->GetEntriesFast();
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      Result += Dir[IDX++][0] * synapse->GetDEDw();
   }
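
SetGammaDelta(), SetDir() and SteepestDir() provide the ingredients of a quasi-Newton step: with s_k the last weight change (Delta, taken from the line-search buffer), y_k the corresponding gradient change (Gamma) and H_k the approximate inverse Hessian,

   d_k = -H_k \nabla E_k \quad (\texttt{SetDir}), \qquad d_k = -\nabla E_k \quad (\texttt{SteepestDir}),

and the textbook BFGS update of the inverse Hessian reads

   H_{k+1} = \bigl(I - \rho_k\, s_k y_k^{\top}\bigr)\, H_k \,\bigl(I - \rho_k\, y_k s_k^{\top}\bigr) + \rho_k\, s_k s_k^{\top}, \qquad \rho_k = \frac{1}{y_k^{\top} s_k}.

GetHessian() is not shown in these fragments, so take the update above as the standard form rather than a transcription of the code.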

// LineSearch: bracket the minimum along Dir, fit a parabola, and move there;
// returns kTRUE on failure
   Int_t nSynapses = fSynapses->GetEntriesFast();
   Int_t nWeights  = nSynapses;
   // ...
   std::vector<Double_t> Origin(nWeights);
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
   }
   // ...
   if      (alpha2 < 0.01) alpha2 = 0.01;
   else if (alpha2 > 2.0)  alpha2 = 2.0;
   // ...
   SetDirWeights( Origin, Dir, alpha2 );
   // ...
   for (Int_t i=0;i<100;i++) {
      // ...
      SetDirWeights(Origin, Dir, alpha3);
      // ...
   }
   // ...
      SetDirWeights(Origin, Dir, 0.);
      // ...
      for (Int_t i=0;i<100;i++) {
         // ...
      }
      // ...
      Log() << kWARNING << "linesearch, starting to investigate direction opposite of steepestDIR" << Endl;
      alpha2 = -alpha_original;
      // ...
      SetDirWeights(Origin, Dir, alpha2);
      // ...
      SetDirWeights(Origin, Dir, 0.);
      Log() << kWARNING << "linesearch, failed even in opposite direction of steepestDIR" << Endl;
   // ...
   if (alpha1>0 && alpha2>0 && alpha3 > 0) {
      fLastAlpha = 0.5 * (alpha1 + alpha3 -
                          (err3 - err1) / ((err3 - err2) / ( alpha3 - alpha2 )
                                           - ( err2 - err1 ) / (alpha2 - alpha1 )));
   }
   // ...
   fLastAlpha = fLastAlpha < 10000 ? fLastAlpha : 10000;
   // ...
   SetDirWeights(Origin, Dir, fLastAlpha);
   // ...
   if (finalError > err1) {
      Log() << kWARNING << "Line search increased error! Something is wrong."
            << " fLastAlpha=" << fLastAlpha << " al123=" << alpha1 << " "
            << alpha2 << " " << alpha3 << " err1=" << err1
            << " errfinal=" << finalError << Endl;
   }
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      buffer[IDX] = synapse->GetWeight() - Origin[IDX];
      // ...
   }
   // ...
   if (dError) (*dError)=(errOrigin-finalError)/finalError;
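
The fLastAlpha assignment above is the minimum of the parabola through the three probed points (alpha1, err1), (alpha2, err2) and (alpha3, err3):

   \alpha_{\min} \;=\; \frac{1}{2}\left[\,\alpha_1 + \alpha_3 \;-\; \frac{E_3 - E_1}{\dfrac{E_3 - E_2}{\alpha_3 - \alpha_2} - \dfrac{E_2 - E_1}{\alpha_2 - \alpha_1}}\,\right],

which is then capped at 10000 before the weights are moved by SetDirWeights(Origin, Dir, fLastAlpha).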

// SetDirWeights: move all weights to Origin + alpha * Dir
   Int_t nSynapses = fSynapses->GetEntriesFast();
   // ...
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      synapse->SetWeight( Origin[IDX] + Dir[IDX][0] * alpha );
      // ...
   }
   // ...
   if (fUseRegulator) UpdatePriors();

// sum the per-event error (MSE or cross-entropy) over all events,
// adding the regulator prior if enabled
   UInt_t ntgts = GetNTargets();

   // ... event loop ...
      const Event* ev = GetEvent(i);
      // ...
      if ((ev->GetWeight() < 0) && IgnoreEventsWithNegWeightsInTraining()
          // ...
      // ...
      if (DoRegression()) {
         for (UInt_t itgt = 0; itgt < ntgts; itgt++) {
            error += GetMSEErr( ev, itgt );
         }
      }
      else if (DoMulticlass()) {
         for (UInt_t icls = 0, iclsEnd = DataInfo().GetNClasses(); icls < iclsEnd; icls++) {
            error += GetMSEErr( ev, icls );
         }
      }
      // ...
      if      (fEstimator==kMSE) error = GetMSEErr( ev );
      else if (fEstimator==kCE)  error = GetCEErr( ev );
      // ...
   if (fUseRegulator) Result+=fPrior;
   if (Result<0) Log() << kWARNING << "\nNegative Error!!! :" << Result-fPrior << "+" << fPrior << Endl;

// GetMSEErr: mean-squared-error contribution of one event
   if      (DoRegression()) target = ev->GetTarget( index );
   else if (DoMulticlass()) target = (ev->GetClass() == index ? 1.0 : 0.0 );
   else                     target = GetDesiredOutput( ev );
   // ...
   error = 0.5*(output-target)*(output-target);

// GetCEErr: cross-entropy contribution of one event (same target selection)
   if      (DoRegression()) target = ev->GetTarget( index );
   else if (DoMulticlass()) target = (ev->GetClass() == index ? 1.0 : 0.0 );
   else                     target = GetDesiredOutput( ev );
   // ...
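
Both error functions pick the target the same way and differ only in the loss. The MSE expression is shown above; the cross-entropy body is elided, so the second form below is the conventional binary cross-entropy rather than a copy of the code (o = output activation, t = target):

   E_{\mathrm{MSE}} = \tfrac{1}{2}\,(o - t)^2, \qquad E_{\mathrm{CE}} = -\,t\ln o \;-\; (1 - t)\ln(1 - o).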

// BackPropagationMinimize: train the network with the back-propagation algorithm
   Timer timer( (fSteps>0?100:nEpochs), GetName() );
   // ...
   fEstimatorHistTrain = new TH1F( "estimatorHistTrain", "training estimator",
                                   nbinTest, Int_t(fTestRate/2), nbinTest*fTestRate+Int_t(fTestRate/2) );
   fEstimatorHistTest  = new TH1F( "estimatorHistTest", "test estimator",
                                   nbinTest, Int_t(fTestRate/2), nbinTest*fTestRate+Int_t(fTestRate/2) );
   // ...
   if (fSamplingTraining || fSamplingTesting)
      Data()->InitSampling(1.0,1.0,fRandomSeed);
   // ...
   if (fSteps > 0) Log() << kINFO << "Inaccurate progress timing for MLP... " << Endl;
   // ...
   for (Int_t i = 0; i < nEpochs; i++) {
      if (Float_t(i)/nEpochs < fSamplingEpoch) {
         if ((i+1)%fTestRate == 0 || (i == 0)) {
            if (fSamplingTraining) {
               // ...
               Data()->InitSampling(fSamplingFraction,fSamplingWeight);
               Data()->CreateSampling();
            }
            if (fSamplingTesting) {
               // ...
               Data()->InitSampling(fSamplingFraction,fSamplingWeight);
               Data()->CreateSampling();
            }
         }
      }
      else {
         // ...
         Data()->InitSampling(1.0,1.0);
         // ...
         Data()->InitSampling(1.0,1.0);
      }
      // ...
      DecaySynapseWeights(i >= lateEpoch);
      // ...
      if ((i+1)%fTestRate == 0) {
         // ...
         fEstimatorHistTrain->Fill( i+1, trainE );
         fEstimatorHistTest ->Fill( i+1, testE );
         // ...
         if ((testE < GetCurrentValue()) || (GetCurrentValue()<1e-100)) {
            // ...
         }
         Data()->EventResult( success );
         // ...
         SetCurrentValue( testE );
         if (HasConverged()) {
            if (Float_t(i)/nEpochs < fSamplingEpoch) {
               Int_t newEpoch = Int_t(fSamplingEpoch*nEpochs);
               // ...
               ResetConvergenceCounter();
            }
            // ...
            if (lateEpoch > i) lateEpoch = i;
            // ...
         }
      }
      // ...
      TString convText = Form( "<D^2> (train/test): %.4g/%.4g", trainE, testE );
      // ...
      if (Float_t(i)/nEpochs < fSamplingEpoch)
         progress = Progress()*fSamplingEpoch*fSamplingFraction*100;
      // ...
         progress = 100*(fSamplingEpoch*fSamplingFraction+(1.0-fSamplingFraction*fSamplingEpoch)*Progress());
      // ...
   }

// TrainOneEpoch: train the network over a single epoch (one pass over the events)
   Shuffle(index, nEvents);

   // ... event loop ...
      const Event * ev = GetEvent(index[i]);
      if ((ev->GetWeight() < 0) && IgnoreEventsWithNegWeightsInTraining()
          // ...
      // ...
      TrainOneEvent(index[i]);
      // ...
      if (fBPMode == kBatch && (i+1)%fBatchSize == 0) {
         AdjustSynapseWeights();
         if (fgPRINT_BATCH) {
            // ...
         }
      }

// Shuffle: randomly permute the event indices so that each epoch sees the
// events in a different order
   for (Int_t i = 0; i < n; i++) {
      j = (Int_t) (frgen->Rndm() * a);
      // ...
      index[j] = index[i];
      // ...
   }

// DecaySynapseWeights: lower the learning rate of every synapse
   Int_t numSynapses = fSynapses->GetEntriesFast();
   for (Int_t i = 0; i < numSynapses; i++) {
      synapse = (TSynapse*)fSynapses->At(i);
      // ...
   }

// TrainOneEventFast: fast per-event training using a flat branch buffer
   if (type == 0) desired = fOutput->GetMin();  // background
   else           desired = fOutput->GetMax();  // signal
   // ...
   for (UInt_t j = 0; j < GetNvar(); j++) {
      // ...
      neuron = GetInputNeuron(j);
      // ...
   }
   // ...
   ForceNetworkCalculations();
   UpdateNetwork(desired, eventWeight);

// TrainOneEvent: train the network on a single event
   const Event * ev = GetEvent(ievt);
   // ...
   ForceNetworkInputs( ev );
   ForceNetworkCalculations();
   if (DoRegression()) UpdateNetwork( ev->GetTargets(), eventWeight );
   if (DoMulticlass()) UpdateNetwork( *DataInfo().GetTargetsForMulticlass( ev ), eventWeight );
   else                UpdateNetwork( GetDesiredOutput( ev ), eventWeight );

// GetDesiredOutput: desired output value of a classification event
   return DataInfo().IsSignal(ev) ? fOutput->GetMax() : fOutput->GetMin();

// UpdateNetwork: set the output-neuron error from how closely the output
// matched the desired value, then back-propagate
   Double_t error = GetOutputNeuron()->GetActivationValue() - desired;
   if      (fEstimator==kMSE) error = GetOutputNeuron()->GetActivationValue() - desired;
   else if (fEstimator==kCE)  error = -1./(GetOutputNeuron()->GetActivationValue() -1 + desired);
   else    Log() << kFATAL << "Estimator type unspecified!!" << Endl;
   error *= eventWeight;
   GetOutputNeuron()->SetError(error);
   CalculateNeuronDeltas();
   // ...

// UpdateNetwork (vector of targets, used for regression and multiclass)
   for (UInt_t i = 0, iEnd = desired.size(); i < iEnd; ++i) {
      Double_t error = GetOutputNeuron( i )->GetActivationValue() - desired.at(i);
      error *= eventWeight;
      GetOutputNeuron( i )->SetError(error);
   }
   CalculateNeuronDeltas();
   // ...
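
The quantity stored with SetError() is the derivative of the per-event loss with respect to the output activation o, which is exactly what the subsequent back-propagation of neuron deltas needs. For the two estimators, with t = desired restricted to {0,1} for classification,

   \frac{\partial E_{\mathrm{MSE}}}{\partial o} = o - t, \qquad \frac{\partial E_{\mathrm{CE}}}{\partial o} = -\frac{t}{o} + \frac{1 - t}{1 - o} = -\frac{1}{o - 1 + t} \quad (t \in \{0,1\}),

each scaled by the event weight, matching the two assignments in the scalar UpdateNetwork() above.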

// CalculateNeuronDeltas: back-propagate the deltas layer by layer
   Int_t numLayers = fNetwork->GetEntriesFast();
   // ...
   for (Int_t i = numLayers-1; i >= 0; i--) {
      // ...
      for (Int_t j = 0; j < numNeurons; j++) {
         // ...
      }
   }

// GeneticMinimize: treat the synapse weights as parameters of a genetic algorithm
   PrintMessage("Minimizing Estimator with GA");
   // ...
   fGA_SC_factor = 0.95;
   // ...
   std::vector<Interval*> ranges;
   // ...
   Int_t numWeights = fSynapses->GetEntriesFast();
   for (Int_t ivar=0; ivar< numWeights; ivar++) {
      ranges.push_back( new Interval( 0, GetXmax(ivar) - GetXmin(ivar) ));
   }
   // ...
   Double_t estimator = CalculateEstimator();
   Log() << kINFO << "GA: estimator after optimization: " << estimator << Endl;

// EstimatorFunction: fitter interface, forwards to ComputeEstimator
   return ComputeEstimator( parameters );

// ComputeEstimator: load the parameter vector into the synapse weights and
// evaluate the estimator (called by the GA)
   Int_t numSynapses = fSynapses->GetEntriesFast();
   // ...
   for (Int_t i = 0; i < numSynapses; i++) {
      synapse = (TSynapse*)fSynapses->At(i);
      // ...
   }
   if (fUseRegulator) UpdatePriors();
   // ...
   Double_t estimator = CalculateEstimator();

// forward pass over all layers and neurons (update of the pre-synapses)
   for (Int_t i = 0; i < numLayers; i++) {
      // ...
      for (Int_t j = 0; j < numNeurons; j++) {
         // ...
      }
   }

// backward pass over all layers and neurons (adjustment of the synapse weights)
   for (Int_t i = numLayers-1; i >= 0; i--) {
      // ...
      for (Int_t j = 0; j < numNeurons; j++) {
         // ...
      }
   }

// UpdatePriors: accumulate the regulator (weight-decay) prior and its gradient
   Int_t nSynapses = fSynapses->GetEntriesFast();
   for (Int_t i=0;i<nSynapses;i++) {
      // ...
      fPrior += 0.5*fRegulators[fRegulatorIdx[i]]*(synapse->GetWeight())*(synapse->GetWeight());
      fPriorDev.push_back(fRegulators[fRegulatorIdx[i]]*(synapse->GetWeight()));
   }
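
Written out, UpdatePriors() accumulates a quadratic (weight-decay) penalty and its gradient, with one regulator strength per synapse class c(i) = fRegulatorIdx[i]:

   P = \tfrac{1}{2}\sum_i \alpha_{c(i)}\, w_i^2, \qquad \frac{\partial P}{\partial w_i} = \alpha_{c(i)}\, w_i .

P is added to the error when the regulator is active (Result += fPrior above) and the gradient terms fPriorDev[i] are added to each synapse's dE/dw.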

// update of the regulator strengths (one per synapse class) from the current
// inverse Hessian
   GetApproxInvHessian(InvH);
   Int_t numSynapses   = fSynapses->GetEntriesFast();
   Int_t numRegulators = fRegulators.size();
   // ...
   std::vector<Int_t>    nWDP(numRegulators);
   std::vector<Double_t> trace(numRegulators), weightSum(numRegulators);
   for (int i=0;i<numSynapses;i++) {
      // ...
      Int_t idx = fRegulatorIdx[i];
      // ...
      trace[idx] += InvH[i][i];
      gamma      += 1 - fRegulators[idx]*InvH[i][i];
      // ...
   }
   // ...
   if (fEstimator==kMSE) {
      if (GetNEvents() > gamma) variance = CalculateEstimator( Types::kTraining, 0 )/(1-(gamma/GetNEvents()));
      // ...
   }
   // ...
   for (int i=0;i<numRegulators;i++) {
      // ...
      fRegulators[i] = variance*nWDP[i]/(weightSum[i]+variance*trace[i]);
      if (fRegulators[i]<0) fRegulators[i]=0;
      Log() << kDEBUG << "R" << i << ":" << fRegulators[i] << "\t";
   }
   // ...
   Log() << kDEBUG << "\n" << "trainE:" << trainE << "\ttestE:" << testE
         << "\tvariance:" << variance << "\tgamma:" << gamma << Endl;
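
Using the quantities accumulated in the loop (trace[c]: the part of Tr(H^{-1}) belonging to regulator class c; nWDP[c]: the number of weights in that class; weightSum[c]: their summed squares, where the accumulation of nWDP and weightSum sits in elided lines, so that reading is an assumption), the update line corresponds to

   \gamma = \sum_i \bigl(1 - \alpha_{c(i)}\,[H^{-1}]_{ii}\bigr), \qquad \sigma^2 = \frac{E_{\mathrm{train}}}{1 - \gamma/N_{\mathrm{ev}}}, \qquad \alpha_c \;\leftarrow\; \frac{\sigma^2\, N_c}{\sum_{i\in c} w_i^2 + \sigma^2\,\mathrm{Tr}_c(H^{-1})},

which matches the evidence-approximation (MacKay-style) re-estimation of regularisation strengths.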

// GetApproxInvHessian: outer-product approximation of the Hessian from the
// per-event output sensitivities, then inverted
   Int_t numSynapses=fSynapses->GetEntriesFast();
   InvHessian.ResizeTo( numSynapses, numSynapses );

   // ... event loop ...
      double outputValue=GetMvaValue();
      GetOutputNeuron()->SetError(1./fOutput->EvalDerivative(GetOutputNeuron()->GetValue()));
      CalculateNeuronDeltas();
      for (Int_t j = 0; j < numSynapses; j++){
         // ...
         sens[j][0]=sensT[0][j]=synapses->GetDelta();
      }
      if      (fEstimator==kMSE) InvHessian+=sens*sensT;
      else if (fEstimator==kCE)  InvHessian+=(outputValue*(1-outputValue))*sens*sensT;
   // ...
   if (regulate) {
      for (Int_t i = 0; i < numSynapses; i++){
         InvHessian[i][i]+=fRegulators[fRegulatorIdx[i]];
      }
   }
   else {
      for (Int_t i = 0; i < numSynapses; i++){
         InvHessian[i][i]+=1e-6;  // avoid precision problems that would make the matrix non-invertible
      }
   }

// asymmetric error on the MVA value, propagated from the inverse Hessian
   if (!fCalculateErrors || errLower==0 || errUpper==0)
      // ...

   Double_t MvaUpper,MvaLower,median,variance;
   Int_t numSynapses=fSynapses->GetEntriesFast();
   if (fInvHessian.GetNcols()!=numSynapses) {
      Log() << kWARNING << "inconsistent dimension " << fInvHessian.GetNcols() << " vs " << numSynapses << Endl;
   }
   // ...
   GetOutputNeuron()->SetError(1./fOutput->EvalDerivative(GetOutputNeuron()->GetValue()));
   // ...
   CalculateNeuronDeltas();
   for (Int_t i = 0; i < numSynapses; i++){
      // ...
   }
   // ...
   TMatrixD sig=sensT*fInvHessian*sens;
   // ...
   median=GetOutputNeuron()->GetValue();
   // ...
      Log() << kWARNING << "Negative variance!!! median=" << median << "\tvariance(sigma^2)=" << variance << Endl;
   // ...
   variance=sqrt(variance);
   // ...
   MvaUpper=fOutput->Eval(median+variance);
   // ...
   *errUpper=MvaUpper-MvaValue;
   // ...
   MvaLower=fOutput->Eval(median-variance);
   // ...
   *errLower=MvaValue-MvaLower;
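
The error band is therefore obtained by linear error propagation through the output transfer function f (fOutput): with s the vector of output sensitivities dy/dw_j taken from the back-propagated deltas, mu the untransformed output (median above) and H^{-1} the stored inverse Hessian,

   \sigma^2 = s^{\top} H^{-1} s, \qquad \mathrm{err}_{\uparrow} = f(\mu + \sigma) - \mathrm{MVA}, \qquad \mathrm{err}_{\downarrow} = \mathrm{MVA} - f(\mu - \sigma),

where sigma is the square root taken in the variance=sqrt(variance) line above.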

#ifdef MethodMLP_UseMinuit__

// MinuitMinimize: minimize the estimator with Minuit, one fit parameter per weight
void TMVA::MethodMLP::MinuitMinimize()
{
   fNumberOfWeights = fSynapses->GetEntriesFast();
   // ...
   for (Int_t ipar=0; ipar < fNumberOfWeights; ipar++) {
      // ...
      tfitter->SetParameter( ipar, parName, w[ipar], 0.1, 0, 0 );
   }
   // ...
   tfitter->SetFCN( &IFCN );
   // ...
}

//______________________________________________________________________________
// IFCN: static Minuit interface, forwards the call to the method instance
   ((MethodMLP*)GetThisPtr())->FCN( npars, grad, f, fitPars, iflag );

// call counter and best estimator seen so far (thread-local)
TTHREAD_TLS(Int_t)  nc   = 0;
TTHREAD_TLS(double) minf = 1000000;

// FCN: copy the fit parameters into the synapse weights and evaluate the estimator
   for (Int_t ipar=0; ipar<fNumberOfWeights; ipar++) {
      // ...
   }
   // ...
   f = CalculateEstimator();
   // ...
   if (f < minf) minf = f;
   for (Int_t ipar=0; ipar<fNumberOfWeights; ipar++) Log() << kDEBUG << fitPars[ipar] << " ";
   // ...
   Log() << kDEBUG << "***** New estimator: " << f << " min: " << minf << " --> ncalls: " << nc << Endl;

// GetHelpMessage: print a short description of the method, its performance
// and the most important configuration options
   Log() << col << "--- Short description:" << colres << Endl;

   Log() << "The MLP artificial neural network (ANN) is a traditional feed-" << Endl;
   Log() << "forward multilayer perceptron implementation. The MLP has a user-" << Endl;
   Log() << "defined hidden layer architecture, while the number of input (output)" << Endl;
   Log() << "nodes is determined by the input variables (output classes, i.e., " << Endl;
   Log() << "signal and one background). " << Endl;

   Log() << col << "--- Performance optimisation:" << colres << Endl;

   Log() << "Neural networks are stable and perform well for a large variety of " << Endl;
   Log() << "linear and non-linear classification problems. However, in contrast" << Endl;
   Log() << "to (e.g.) boosted decision trees, the user is advised to reduce the " << Endl;
   Log() << "number of input variables that have only little discrimination power. " << Endl;

   Log() << "In the tests we have carried out so far, the MLP and ROOT networks" << Endl;
   Log() << "(TMlpANN, interfaced via TMVA) performed equally well, with however" << Endl;
   Log() << "a clear speed advantage for the MLP. The Clermont-Ferrand neural " << Endl;
   Log() << "net (CFMlpANN) exhibited worse classification performance in these" << Endl;
   Log() << "tests, which is partly due to the slow convergence of its training" << Endl;
   Log() << "(at least 10k training cycles are required to achieve approximately" << Endl;
   Log() << "competitive results)." << Endl;

   Log() << col << "Overtraining: " << colres
         << "only the TMlpANN performs an explicit separation of the" << Endl;
   Log() << "full training sample into independent training and validation samples." << Endl;
   Log() << "We have found that in most high-energy physics applications the " << Endl;
   Log() << "available degrees of freedom (training events) are sufficient to " << Endl;
   Log() << "constrain the weights of the relatively simple architectures required" << Endl;
   Log() << "to achieve good performance. Hence no overtraining should occur, and " << Endl;
   Log() << "the use of validation samples would only reduce the available training" << Endl;
   Log() << "information. However, if the performance on the training sample is " << Endl;
   Log() << "found to be significantly better than the one found with the inde-" << Endl;
   Log() << "pendent test sample, caution is needed. The results for these samples " << Endl;
   Log() << "are printed to standard output at the end of each training job." << Endl;

   Log() << col << "--- Performance tuning via configuration options:" << colres << Endl;

   Log() << "The hidden layer architecture for all ANNs is defined by the option" << Endl;
   Log() << "\"HiddenLayers=N+1,N,...\", where here the first hidden layer has N+1" << Endl;
   Log() << "neurons and the second N neurons (and so on), and where N is the number " << Endl;
   Log() << "of input variables. Excessive numbers of hidden layers should be avoided," << Endl;
   Log() << "in favour of more neurons in the first hidden layer." << Endl;

   Log() << "The number of cycles should be above 500. As said, if the number of" << Endl;
   Log() << "adjustable weights is small compared to the training sample size," << Endl;
   Log() << "using a large number of training samples should not lead to overtraining." << Endl;
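
As a concrete reading of the architecture option: with four input variables, "HiddenLayers=N+1,N" requests two hidden layers of five and four neurons. A sketch of a corresponding booking string (the Factory setup is assumed and the values are only an example):

   // Hypothetical booking call illustrating the architecture and cycle options
   // discussed in the help text; "factory" is an already configured TMVA::Factory*.
   factory->BookMethod( TMVA::Types::kMLP, "MLP",
                        "NCycles=600:HiddenLayers=N+1,N:TrainingMethod=BP:BPMode=sequential:TestRate=5" );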