doc/v614/MethodDL_8h_source.html

 // @(#)root/tmva/tmva/dnn:$Id$
 // Author: Vladimir Ilievski, Saurav Shekhar

 /**********************************************************************************
  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *
  * Package: TMVA                                                                  *
  * Class  : MethodDL                                                              *
  * Web    : http://tmva.sourceforge.net                                           *
  *                                                                                *
  * Description:                                                                   *
  *      Deep Neural Network Method                                                *
  *                                                                                *
  * Authors (alphabetical):                                                        *
  *      Vladimir Ilievski  <ilievski.vladimir@live.com> - CERN, Switzerland       *
  *      Saurav Shekhar     <sauravshekhar01@gmail.com> - ETH Zurich, Switzerland  *
  *                                                                                *
  * Copyright (c) 2005-2015:                                                       *
  *      CERN, Switzerland                                                         *
  *      U. of Victoria, Canada                                                    *
  *      MPI-K Heidelberg, Germany                                                 *
  *      U. of Bonn, Germany                                                       *
  *                                                                                *
  * Redistribution and use in source and binary forms, with or without             *
  * modification, are permitted according to the terms listed in LICENSE           *
  * (http://tmva.sourceforge.net/LICENSE)                                          *
  **********************************************************************************/

 #ifndef ROOT_TMVA_MethodDL
 #define ROOT_TMVA_MethodDL

 //////////////////////////////////////////////////////////////////////////
 //                                                                      //
 // MethodDL                                                             //
 //                                                                      //
 // Method class for all Deep Learning Networks                          //
 //                                                                      //
 //////////////////////////////////////////////////////////////////////////

 #include "TString.h"

 #include "TMVA/MethodBase.h"
 #include "TMVA/Types.h"

 #include "TMVA/DNN/Architectures/Reference.h"

 #ifdef R__HAS_TMVACPU
 #include "TMVA/DNN/Architectures/Cpu.h"
 #endif

 #ifdef R__HAS_TMVAGPU
 #include "TMVA/DNN/Architectures/Cuda.h"
 #endif

 #include "TMVA/DNN/Functions.h"
 #include "TMVA/DNN/DeepNet.h"

 #include <iosfwd>
 #include <map>
 #include <memory>
 #include <vector>

 namespace TMVA {

 /*! All of the options that can be specified in the training string.
  *
  *  MethodDL stores a vector of these (fTrainingSettings), one entry per
  *  training strategy.
  *
  *  NOTE(review): the per-field descriptions below are inferred from the
  *  field names and types only; the parsing code that fills them is not in
  *  this header -- confirm against MethodDL.cxx. None of the fields has a
  *  default member initializer, so a default-constructed instance has
  *  indeterminate scalar members until they are assigned. */
 struct TTrainingSettings {
    size_t batchSize;                           ///< Presumably the number of events per batch.
    size_t testInterval;                        ///< Presumably how often (in epochs) the test error is evaluated.
    size_t convergenceSteps;                    ///< Presumably the number of steps without improvement before stopping.
    size_t maxEpochs;                           ///< Presumably the upper bound on the number of training epochs.
    DNN::ERegularization regularization;        ///< Regularization type (see DNN::ERegularization).
    Double_t learningRate;                      ///< Presumably the optimizer learning rate.
    Double_t momentum;                          ///< Presumably the optimizer momentum.
    Double_t weightDecay;                       ///< Presumably the weight-decay coefficient.
    std::vector<Double_t> dropoutProbabilities; ///< Presumably one dropout probability per layer -- TODO confirm.
    bool multithreading;                        ///< Presumably enables multithreaded training.
 };

 /*! Method class for all Deep Learning Networks.
  *
  *  The configuration is held as a set of option strings (input layout, batch
  *  layout, network layout, error strategy, training strategy, weight
  *  initialization, architecture) together with the values parsed from them.
  *  The member function definitions are not part of this header. */
 class MethodDL : public MethodBase {

 private:
    // Key-Value vector type, containing the values for the training options
    using KeyValueVector_t = std::vector<std::map<TString, TString>>;
 // #ifdef R__HAS_TMVAGPU
 //    using ArchitectureImpl_t = TMVA::DNN::TCuda<Double_t>;
 // #else
 // do not use arch GPU for evaluation. It is too slow for batch size=1
 #ifdef R__HAS_TMVACPU
    using ArchitectureImpl_t = TMVA::DNN::TCpu<Double_t>;
 #else
    using ArchitectureImpl_t = TMVA::DNN::TReference<Double_t>;
 #endif
 //#endif
    using DeepNetImpl_t = TMVA::DNN::TDeepNet<ArchitectureImpl_t>;
    std::unique_ptr<DeepNetImpl_t> fNet; ///< The stored network used for the evaluation (see fBuildNet)

    /*! The option handling methods */
    void DeclareOptions();
    void ProcessOptions();

    void Init();

    // Functions to parse the layout of the input and of the batch
    void ParseInputLayout();
    void ParseBatchLayout();

    /*! After calling ProcessOptions(), all of the options are parsed,
     *  so using the parsed options, and given the architecture and the
     *  type of the layers, we build the Deep Network passed as
     *  a reference in the function. */
    template <typename Architecture_t, typename Layer_t>
    void CreateDeepNet(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                       std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets);

    // Layer parsers, one per layer type (dense, convolutional, max-pool,
    // reshape, RNN, LSTM). Each one receives the deep net, the `nets` vector,
    // the string describing the layer and a delimiter string.
    // NOTE(review): presumably `delim` separates the tokens inside
    // `layerString` and the parsed layer is appended to `deepNet` -- the
    // definitions are not in this header, confirm there.
    template <typename Architecture_t, typename Layer_t>
    void ParseDenseLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                         std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString, TString delim);

    template <typename Architecture_t, typename Layer_t>
    void ParseConvLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                        std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString, TString delim);

    template <typename Architecture_t, typename Layer_t>
    void ParseMaxPoolLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                           std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString,
                           TString delim);

    template <typename Architecture_t, typename Layer_t>
    void ParseReshapeLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                           std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString,
                           TString delim);

    template <typename Architecture_t, typename Layer_t>
    void ParseRnnLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                       std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString, TString delim);

    template <typename Architecture_t, typename Layer_t>
    void ParseLstmLayer(DNN::TDeepNet<Architecture_t, Layer_t> &deepNet,
                        std::vector<DNN::TDeepNet<Architecture_t, Layer_t>> &nets, TString layerString, TString delim);

    // Training routine, templated on the architecture type.
    template <typename Architecture_t>
    void TrainDeepNet();

    size_t fInputDepth;  ///< The depth of the input.
    size_t fInputHeight; ///< The height of the input.
    size_t fInputWidth;  ///< The width of the input.

    size_t fBatchDepth;  ///< The depth of the batch used to train the deep net.
    size_t fBatchHeight; ///< The height of the batch used to train the deep net.
    size_t fBatchWidth;  ///< The width of the batch used to train the deep net.

    size_t fRandomSeed;  ///<The random seed used to initialize the weights and shuffling batches (default is zero)

    DNN::EInitialization fWeightInitialization; ///< The initialization method
    DNN::EOutputFunction fOutputFunction;       ///< The output function for making the predictions
    DNN::ELossFunction fLossFunction;           ///< The loss function

    TString fInputLayoutString;          ///< The string defining the layout of the input
    TString fBatchLayoutString;          ///< The string defining the layout of the batch
    TString fLayoutString;               ///< The string defining the layout of the deep net
    TString fErrorStrategy;              ///< The string defining the error strategy for training
    TString fTrainingStrategyString;     ///< The string defining the training strategy
    TString fWeightInitializationString; ///< The string defining the weight initialization method
    TString fArchitectureString;         ///< The string defining the architecture: CPU or GPU
    // NOTE(review): fResume is undocumented and has no accessor in this header;
    // presumably it requests resuming a previous training -- confirm in MethodDL.cxx.
    bool fResume;
    bool fBuildNet;                     ///< Flag to control whether to build fNet, the stored network used for the evaluation

    KeyValueVector_t fSettings;                       ///< Map for the training strategy
    std::vector<TTrainingSettings> fTrainingSettings; ///< The vector defining each training strategy

    ClassDef(MethodDL, 0);

 protected:
    // provide a help message
    void GetHelpMessage() const;

 public:
    /*! Constructor */
    MethodDL(const TString &jobName, const TString &methodTitle, DataSetInfo &theData, const TString &theOption);

    /*! Constructor */
    MethodDL(DataSetInfo &theData, const TString &theWeightFile);

    /*! Virtual Destructor */
    virtual ~MethodDL();

    /*! Function for parsing the training settings, provided as a string
     *  in a key-value form.  */
    KeyValueVector_t ParseKeyValueString(TString parseString, TString blockDelim, TString tokenDelim);

    /*! Check the type of analysis the deep learning network can do */
    Bool_t HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets);

    /*! Methods for training the deep learning network */
    void Train();

    /*! Return the MVA value. Both pointer arguments are optional and default
     *  to null.
     *  NOTE(review): presumably they receive the lower/upper error of the
     *  value when non-null -- confirm against the definition. */
    Double_t GetMvaValue(Double_t *err = nullptr, Double_t *errUpper = nullptr);

    /*! Methods for writing and reading weights */
    using MethodBase::ReadWeightsFromStream;
    void AddWeightsXMLTo(void *parent) const;
    void ReadWeightsFromXML(void *wghtnode);
    void ReadWeightsFromStream(std::istream &);

    /* Create ranking */
    const Ranking *CreateRanking();

    /* Getters */
    size_t GetInputDepth() const { return fInputDepth; }
    size_t GetInputHeight() const { return fInputHeight; }
    size_t GetInputWidth() const { return fInputWidth; }

    size_t GetBatchDepth() const { return fBatchDepth; }
    size_t GetBatchHeight() const { return fBatchHeight; }
    size_t GetBatchWidth() const { return fBatchWidth; }

    /*! Access the stored network. fNet is dereferenced without a null check,
     *  so this must only be called once fNet holds a network. */
    const DeepNetImpl_t & GetDeepNet() const { return *fNet; }

    DNN::EInitialization GetWeightInitialization() const { return fWeightInitialization; }
    DNN::EOutputFunction GetOutputFunction() const { return fOutputFunction; }
    DNN::ELossFunction GetLossFunction() const { return fLossFunction; }

    // The string getters return copies of the stored option strings.
    TString GetInputLayoutString() const { return fInputLayoutString; }
    TString GetBatchLayoutString() const { return fBatchLayoutString; }
    TString GetLayoutString() const { return fLayoutString; }
    TString GetErrorStrategyString() const { return fErrorStrategy; }
    TString GetTrainingStrategyString() const { return fTrainingStrategyString; }
    TString GetWeightInitializationString() const { return fWeightInitializationString; }
    TString GetArchitectureString() const { return fArchitectureString; }

    // Const and mutable access to the parsed training settings and to the
    // key-value settings; the non-const overloads let callers modify them in place.
    const std::vector<TTrainingSettings> &GetTrainingSettings() const { return fTrainingSettings; }
    std::vector<TTrainingSettings> &GetTrainingSettings() { return fTrainingSettings; }
    const KeyValueVector_t &GetKeyValueSettings() const { return fSettings; }
    KeyValueVector_t &GetKeyValueSettings() { return fSettings; }

    /** Setters */
    void SetInputDepth(size_t inputDepth) { fInputDepth = inputDepth; }
    void SetInputHeight(size_t inputHeight) { fInputHeight = inputHeight; }
    void SetInputWidth(size_t inputWidth) { fInputWidth = inputWidth; }

    void SetBatchDepth(size_t batchDepth) { fBatchDepth = batchDepth; }
    void SetBatchHeight(size_t batchHeight) { fBatchHeight = batchHeight; }
    void SetBatchWidth(size_t batchWidth) { fBatchWidth = batchWidth; }

    void SetWeightInitialization(DNN::EInitialization weightInitialization)
    {
       fWeightInitialization = weightInitialization;
    }
    void SetOutputFunction(DNN::EOutputFunction outputFunction) { fOutputFunction = outputFunction; }
    // The string setters only store the given string in the corresponding
    // member; nothing is re-parsed here.
    void SetErrorStrategyString(TString errorStrategy) { fErrorStrategy = errorStrategy; }
    void SetTrainingStrategyString(TString trainingStrategyString) { fTrainingStrategyString = trainingStrategyString; }
    void SetWeightInitializationString(TString weightInitializationString)
    {
       fWeightInitializationString = weightInitializationString;
    }
    void SetArchitectureString(TString architectureString) { fArchitectureString = architectureString; }
    void SetLayoutString(TString layoutString) { fLayoutString = layoutString; }
 };

 } // namespace TMVA

 #endif
TMVA::MethodDL::SetBatchHeight
void SetBatchHeight(size_t batchHeight)
Definition: MethodDL.h:238

TMVA::TTrainingSettings::learningRate
Double_t learningRate
Definition: MethodDL.h:68

TMVA::MethodDL::GetLossFunction
DNN::ELossFunction GetLossFunction() const
Definition: MethodDL.h:217

TMVA::MethodDL::SetArchitectureString
void SetArchitectureString(TString architectureString)
Definition: MethodDL.h:252

TMVA::MethodDL::fLayoutString
TString fLayoutString
The string defining the layout of the deep net.
Definition: MethodDL.h:156

TMVA::DNN::TCpu
The TCpu architecture class.
Definition: Cpu.h:43

TMVA::MethodDL::SetInputDepth
void SetInputDepth(size_t inputDepth)
Setters.
Definition: MethodDL.h:233

Cpu.h

TMVA::MethodDL::SetWeightInitializationString
void SetWeightInitializationString(TString weightInitializationString)
Definition: MethodDL.h:248

TMVA::TTrainingSettings::testInterval
size_t testInterval
Definition: MethodDL.h:64

TMVA::MethodDL::GetTrainingSettings
std::vector< TTrainingSettings > & GetTrainingSettings()
Definition: MethodDL.h:228

TMVA::MethodDL::SetBatchWidth
void SetBatchWidth(size_t batchWidth)
Definition: MethodDL.h:239

TMVA::MethodDL::GetWeightInitialization
DNN::EInitialization GetWeightInitialization() const
Definition: MethodDL.h:215

TMVA::TTrainingSettings::multithreading
bool multithreading
Definition: MethodDL.h:72

TMVA::TTrainingSettings::maxEpochs
size_t maxEpochs
Definition: MethodDL.h:66

TMVA::Types::EAnalysisType
EAnalysisType
Definition: Types.h:127

TMVA::MethodBase
Virtual base Class for all MVA method.
Definition: MethodBase.h:109

TMVA::MethodDL::fOutputFunction
DNN::EOutputFunction fOutputFunction
The output function for making the predictions.
Definition: MethodDL.h:151

TMVA::MethodDL::fWeightInitialization
DNN::EInitialization fWeightInitialization
The initialization method.
Definition: MethodDL.h:150

TMVA::MethodDL::GetBatchWidth
size_t GetBatchWidth() const
Definition: MethodDL.h:211

TMVA::MethodDL::GetLayoutString
TString GetLayoutString() const
Definition: MethodDL.h:221

TString
Basic string class.
Definition: TString.h:131

TMVA::Ranking
Ranking for variables in method (implementation)
Definition: Ranking.h:48

Functions.h

Bool_t
bool Bool_t
Definition: RtypesCore.h:59

TMVA::MethodDL::SetOutputFunction
void SetOutputFunction(DNN::EOutputFunction outputFunction)
Definition: MethodDL.h:245

TMVA::MethodDL::fRandomSeed
size_t fRandomSeed
The random seed used to initialize the weights and shuffling batches (default is zero) ...
Definition: MethodDL.h:148

Reference.h

TMVA::MethodDL::SetErrorStrategyString
void SetErrorStrategyString(TString errorStrategy)
Definition: MethodDL.h:246

TMVA::MethodDL::fArchitectureString
TString fArchitectureString
The string defining the architecture: CPU or GPU.
Definition: MethodDL.h:160

TMVA::MethodDL::SetLayoutString
void SetLayoutString(TString layoutString)
Definition: MethodDL.h:253

TMVA::DNN::EInitialization
EInitialization
Definition: Functions.h:70

TMVA::MethodDL::SetWeightInitialization
void SetWeightInitialization(DNN::EInitialization weightInitialization)
Definition: MethodDL.h:241

TMVA::MethodDL::fInputDepth
size_t fInputDepth
The depth of the input.
Definition: MethodDL.h:140

ClassDef
#define ClassDef(name, id)
Definition: Rtypes.h:320

TMVA::DNN::TReference
The reference architecture class.
Definition: DataLoader.h:30

TClassEdit::Init
void Init(TClassEdit::TInterpreterLookupHelper *helper)
Definition: TClassEdit.cxx:121

TMVA::MethodDL::GetDeepNet
const DeepNetImpl_t & GetDeepNet() const
Definition: MethodDL.h:213

TMVA::MethodDL::fTrainingStrategyString
TString fTrainingStrategyString
The string defining the training strategy.
Definition: MethodDL.h:158

TMVA::MethodDL::fBuildNet
bool fBuildNet
Flag to control whether to build fNet, the stored network used for the evaluation.
Definition: MethodDL.h:162

TMVA::MethodDL::KeyValueVector_t
std::vector< std::map< TString, TString > > KeyValueVector_t
Definition: MethodDL.h:79

TMVA::MethodDL::SetBatchDepth
void SetBatchDepth(size_t batchDepth)
Definition: MethodDL.h:237

TMVA::MethodDL::fBatchLayoutString
TString fBatchLayoutString
The string defining the layout of the batch.
Definition: MethodDL.h:155

TMVA::DataSetInfo
Class that contains all the data information.
Definition: DataSetInfo.h:60

TMVA::MethodDL::GetBatchLayoutString
TString GetBatchLayoutString() const
Definition: MethodDL.h:220

TMVA::MethodDL::GetArchitectureString
TString GetArchitectureString() const
Definition: MethodDL.h:225

TMVA::MethodDL::SetTrainingStrategyString
void SetTrainingStrategyString(TString trainingStrategyString)
Definition: MethodDL.h:247

Types.h

TMVA::MethodDL::SetInputWidth
void SetInputWidth(size_t inputWidth)
Definition: MethodDL.h:235

TString.h

TMVA::TTrainingSettings
All of the options that can be specified in the training string.
Definition: MethodDL.h:62

TMVA::TTrainingSettings::weightDecay
Double_t weightDecay
Definition: MethodDL.h:70

TMVA::MethodDL::fInputWidth
size_t fInputWidth
The width of the input.
Definition: MethodDL.h:142

TMVA::MethodDL::GetWeightInitializationString
TString GetWeightInitializationString() const
Definition: MethodDL.h:224

TMVA::MethodDL::fLossFunction
DNN::ELossFunction fLossFunction
The loss function.
Definition: MethodDL.h:152

TMVA::TTrainingSettings::batchSize
size_t batchSize
Definition: MethodDL.h:63

TMVA::MethodDL::DeepNetImpl_t
TMVA::DNN::TDeepNet< ArchitectureImpl_t > DeepNetImpl_t
Definition: MethodDL.h:90

TMVA::TTrainingSettings::momentum
Double_t momentum
Definition: MethodDL.h:69

TMVA::MethodDL::GetErrorStrategyString
TString GetErrorStrategyString() const
Definition: MethodDL.h:222

TMVA::MethodDL::fTrainingSettings
std::vector< TTrainingSettings > fTrainingSettings
The vector defining each training strategy.
Definition: MethodDL.h:165

TMVA::MethodDL::GetTrainingSettings
const std::vector< TTrainingSettings > & GetTrainingSettings() const
Definition: MethodDL.h:227

TMVA::MethodDL::GetBatchDepth
size_t GetBatchDepth() const
Definition: MethodDL.h:209

TMVA::MethodDL::GetInputLayoutString
TString GetInputLayoutString() const
Definition: MethodDL.h:219

TMVA::MethodDL::GetInputDepth
size_t GetInputDepth() const
Definition: MethodDL.h:205

UInt_t
unsigned int UInt_t
Definition: RtypesCore.h:42

TMVA::MethodDL::fBatchDepth
size_t fBatchDepth
The depth of the batch used to train the deep net.
Definition: MethodDL.h:144

TMVA::TTrainingSettings::convergenceSteps
size_t convergenceSteps
Definition: MethodDL.h:65

TMVA::MethodDL::fSettings
KeyValueVector_t fSettings
Map for the training strategy.
Definition: MethodDL.h:164

TMVA::MethodDL::fErrorStrategy
TString fErrorStrategy
The string defining the error strategy for training.
Definition: MethodDL.h:157

TMVA::TTrainingSettings::regularization
DNN::ERegularization regularization
Definition: MethodDL.h:67

TMVA::MethodDL::fInputHeight
size_t fInputHeight
The height of the input.
Definition: MethodDL.h:141

TMVA::MethodDL::fResume
bool fResume
Definition: MethodDL.h:161

Double_t
double Double_t
Definition: RtypesCore.h:55

TMVA::DNN::EOutputFunction
EOutputFunction
Enum that represents output functions.
Definition: Functions.h:43

type
int type
Definition: TGX11.cxx:120

TMVA::DNN::ELossFunction
ELossFunction
Enum that represents objective functions for the net, i.e.
Definition: Functions.h:54

TMVA::MethodDL::SetInputHeight
void SetInputHeight(size_t inputHeight)
Definition: MethodDL.h:234

TMVA::MethodDL::GetTrainingStrategyString
TString GetTrainingStrategyString() const
Definition: MethodDL.h:223

TMVA::MethodDL::GetKeyValueSettings
const KeyValueVector_t & GetKeyValueSettings() const
Definition: MethodDL.h:229

TMVA::MethodDL::GetKeyValueSettings
KeyValueVector_t & GetKeyValueSettings()
Definition: MethodDL.h:230

TMVA::MethodDL
Definition: MethodDL.h:75

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMVA::MethodDL::GetOutputFunction
DNN::EOutputFunction GetOutputFunction() const
Definition: MethodDL.h:216

Cuda.h

TMVA::MethodDL::fBatchHeight
size_t fBatchHeight
The height of the batch used to train the deep net.
Definition: MethodDL.h:145

TMVA::MethodDL::ArchitectureImpl_t
TMVA::DNN::TReference< Double_t > ArchitectureImpl_t
Definition: MethodDL.h:87

TMVA::TTrainingSettings::dropoutProbabilities
std::vector< Double_t > dropoutProbabilities
Definition: MethodDL.h:71

TMVA::MethodDL::fInputLayoutString
TString fInputLayoutString
The string defining the layout of the input.
Definition: MethodDL.h:154

TMVA::DNN::ERegularization
ERegularization
Enum representing the regularization type applied for a given layer.
Definition: Functions.h:62

TMVA::MethodBase::ReadWeightsFromStream
virtual void ReadWeightsFromStream(std::istream &)=0

TMVA::MethodDL::GetInputHeight
size_t GetInputHeight() const
Definition: MethodDL.h:206

MethodBase.h

TMVA::MethodDL::GetBatchHeight
size_t GetBatchHeight() const
Definition: MethodDL.h:210

TMVA::MethodDL::GetInputWidth
size_t GetInputWidth() const
Definition: MethodDL.h:207

TMVA::MethodDL::fBatchWidth
size_t fBatchWidth
The width of the batch used to train the deep net.
Definition: MethodDL.h:146

DeepNet.h

TMVA::MethodDL::fWeightInitializationString
TString fWeightInitializationString
The string defining the weight initialization method.
Definition: MethodDL.h:159

TMVA::MethodDL::fNet
std::unique_ptr< DeepNetImpl_t > fNet
Definition: MethodDL.h:91

TMVA::DNN::TDeepNet
Generic Deep Neural Network class.
Definition: DeepNet.h:74