doc/v620/Layer_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Simon Pfreundschuh 20/06/16


/*************************************************************************

 * Copyright (C) 2016, Simon Pfreundschuh                                *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


//////////////////////////////////////////////////////////////////////

// Contains Layer and SharedLayer classes, that represent layers in //

// neural networks.                                                 //

//////////////////////////////////////////////////////////////////////


#ifndef TMVA_DNN_LAYER

#define TMVA_DNN_LAYER


#include <iostream>


#include "TMatrix.h"

#include "Functions.h"


namespace TMVA

{

namespace DNN

{


//______________________________________________________________________________

//

//  The Layer Class

//______________________________________________________________________________


/** \class TLayer

    Generic layer class.

    This generic layer class represents a layer of a neural network with
    a given width n and activation function f. For an input
    \f$\mathbf{x}\f$ the layer first computes the linear combination
    \f$\mathbf{u} = \mathbf{W}\mathbf{x} + \boldsymbol{\theta}\f$ and then
    applies the activation function f to \f$\mathbf{u}\f$.

    In addition to the weight and bias matrices, each layer allocates memory
    for its activations and the corresponding first partial derivatives of
    the activation function as well as the gradients of the weights and biases.

    The layer provides member functions for the forward propagation of
    activations through the given layer and for the backward propagation
    of gradients.

    \tparam Architecture_t Backend type providing Scalar_t, Matrix_t and
    Tensor_t as well as the static functions used by Forward and Backward.
*/
template<typename Architecture_t>
class TLayer
{

public:
   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using Tensor_t = typename Architecture_t::Tensor_t;

private:

   // NOTE: the constructors' initializer lists rely on this declaration order.
   size_t fBatchSize;  ///< Batch size used for training and evaluation.
   size_t fInputWidth; ///< Number of neurons of the previous layer.
   size_t fWidth;      ///< Number of neurons of this layer.

   Scalar_t fDropoutProbability;  ///< Probability that an input is active.

   Matrix_t fWeights;             ///< The weights of this layer.
   Matrix_t fBiases;              ///< The bias values of this layer.
   Matrix_t fOutput;              ///< Activations of this layer.
   Matrix_t fDerivatives;         ///< First derivatives of the activation function of this layer.
   Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weights of this layer.
   Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
   Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

   EActivationFunction fF; ///< Activation function of the layer.

public:

   /*! Construct a layer for the given batch size, input width and width,
    *  using activation function \p f and dropout probability
    *  \p dropoutProbability. */
   TLayer(size_t             BatchSize,
          size_t             InputWidth,
          size_t             Width,
          EActivationFunction f,
          Scalar_t           dropoutProbability);
   /*! Copy constructor. Copies the dimensions, weights and biases of the
    *  given layer. */
   TLayer(const TLayer &);

   /*! Initialize the weights according to the given initialization
    *  method. The biases are initialized to zero. */
   void Initialize(EInitialization m);
   /*! Compute activation of the layer for the given input. The input
    * must be in matrix form with the different rows corresponding to
    * different events in the batch. Computes activations as well as
    * the first partial derivative of the activation function at those
    * activations. If \p applyDropout is set and the dropout probability
    * differs from 1, dropout is applied to \p input first, which
    * modifies \p input. */
   void inline Forward(Matrix_t & input, bool applyDropout = false);
   /*! Compute weight, bias and activation gradients. Uses the precomputed
    *  first partial derivatives of the activation function computed during
    *  forward propagation and modifies them. Must only be called directly
    *  after the corresponding call to Forward(...). */
   void inline Backward(Matrix_t & gradients_backward,
                        const Matrix_t & activations_backward,
                        ERegularization r,
                        Scalar_t weightDecay);

   /*! Print the width and the (integer-coded) activation function of the
    *  layer to standard output. */
   void Print() const;

   size_t GetBatchSize()          const {return fBatchSize;}
   size_t GetInputWidth()         const {return fInputWidth;}
   size_t GetWidth()              const {return fWidth;}
   /*! Returned as Scalar_t: returning an integer type here would truncate
    *  fractional probabilities (e.g. 0.5 would become 0). */
   Scalar_t GetDropoutProbability() const {return fDropoutProbability;}

   void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

   EActivationFunction GetActivationFunction() const {return fF;}

   Matrix_t       & GetOutput()        {return fOutput;}
   const Matrix_t & GetOutput() const  {return fOutput;}
   Matrix_t       & GetWeights()       {return fWeights;}
   const Matrix_t & GetWeights() const {return fWeights;}
   Matrix_t       & GetBiases()       {return fBiases;}
   const Matrix_t & GetBiases() const {return fBiases;}
   Matrix_t       & GetActivationGradients()       {return fActivationGradients;}
   const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
   Matrix_t       & GetBiasGradients()       {return fBiasGradients;}
   const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
   Matrix_t       & GetWeightGradients()       {return fWeightGradients;}
   const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

};


//______________________________________________________________________________

//

//  The Shared Layer Class

//______________________________________________________________________________


/** \class TSharedLayer

    Layer class with shared weight and bias matrices.

    Like the Layer class only that weight matrices are shared between
    different instances of the net, which can be used to implement
    multithreading 'Hogwild' style.

    The weights and biases are held by reference, so the TLayer (or
    TSharedLayer) they were taken from must outlive this object.

    \tparam Architecture_t Backend type providing Scalar_t, Matrix_t and
    Tensor_t as well as the static functions used by Forward and Backward.
*/

template<typename Architecture_t>
class TSharedLayer
{

public:

   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using Tensor_t = typename Architecture_t::Tensor_t;

private:

   // NOTE: the constructors' initializer lists rely on this declaration order.
   size_t fBatchSize;  ///< Batch size used for training and evaluation.
   size_t fInputWidth; ///< Number of neurons of the previous layer.
   size_t fWidth;      ///< Number of neurons of this layer.

   Scalar_t fDropoutProbability;  ///< Probability that an input is active.

   Matrix_t & fWeights;           ///< Reference to the weight matrix of this layer.
   Matrix_t & fBiases;            ///< Reference to the bias vectors of this layer.
   Matrix_t fOutput;              ///< Activations of this layer.
   Matrix_t fDerivatives;         ///< First derivatives of the activation function of this layer.
   Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weights of this layer.
   Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
   Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

   EActivationFunction fF; ///< Activation function of the layer.

public:

   /*! Construct a layer that shares the weights and biases of \p layer
    *  but owns its own output, derivative and gradient matrices sized for
    *  the given batch size. */
   TSharedLayer(size_t BatchSize,
                TLayer<Architecture_t> & layer);
   /*! Copy constructor. The copy refers to the same weight and bias
    *  matrices as \p layer. */
   TSharedLayer(const TSharedLayer & layer);

   /*! Compute activation of the layer for the given input. The input
    * must be in matrix form with the different rows corresponding to
    * different events in the batch. Computes activations as well as
    * the first partial derivative of the activation function at those
    * activations. If \p applyDropout is set and the dropout probability
    * differs from 1, dropout is applied to \p input first, which
    * modifies \p input. */
   void inline Forward(Matrix_t & input, bool applyDropout = false);
   /*! Compute weight, bias and activation gradients. Uses the precomputed
    *  first partial derivatives of the activation function computed during
    *  forward propagation and modifies them. Must only be called directly
    *  after the corresponding call to Forward(...). */
   void inline Backward(Matrix_t & gradients_backward,
                        const Matrix_t & activations_backward,
                        ERegularization r,
                        Scalar_t weightDecay);

   /*! Print the width and the (integer-coded) activation function of the
    *  layer to standard output. */
   void Print() const;

   size_t GetBatchSize()          const {return fBatchSize;}
   size_t GetInputWidth()         const {return fInputWidth;}
   size_t GetWidth()              const {return fWidth;}
   /*! Returned as Scalar_t: returning an integer type here would truncate
    *  fractional probabilities (e.g. 0.5 would become 0). */
   Scalar_t GetDropoutProbability() const {return fDropoutProbability;}

   void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

   EActivationFunction GetActivationFunction() const {return fF;}

   Matrix_t       & GetOutput()        {return fOutput;}
   const Matrix_t & GetOutput() const  {return fOutput;}
   /*! Returns a mutable reference even on a const layer: the weight matrix
    *  is only referenced by this class, not owned by it. */
   Matrix_t       & GetWeights() const {return fWeights;}
   Matrix_t       & GetBiases()       {return fBiases;}
   const Matrix_t & GetBiases() const {return fBiases;}
   Matrix_t       & GetActivationGradients()       {return fActivationGradients;}
   const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
   Matrix_t       & GetBiasGradients()       {return fBiasGradients;}
   const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
   Matrix_t       & GetWeightGradients()       {return fWeightGradients;}
   const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

};


//______________________________________________________________________________

//

//  The Layer Class - Implementation

//______________________________________________________________________________


/// Construct a layer and size all of its matrices.
///
/// The weight and weight-gradient matrices are constructed with
/// (width, inputWidth), the bias and bias-gradient matrices with (width, 1),
/// and the output, derivative and activation-gradient matrices with
/// (batchSize, width). No values are written to the matrices here.
///
/// \param batchSize          Batch size used for training and evaluation.
/// \param inputWidth         Number of neurons of the previous layer.
/// \param width              Number of neurons of this layer.
/// \param f                  Activation function of the layer.
/// \param dropoutProbability Probability that an input is active.
template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(size_t batchSize,
                               size_t inputWidth,
                               size_t width,
                               EActivationFunction f,
                               Scalar_t dropoutProbability)
   : fBatchSize(batchSize),
     fInputWidth(inputWidth),
     fWidth(width),
     fDropoutProbability(dropoutProbability),
     fWeights(width, inputWidth),
     fBiases(width, 1),
     fOutput(batchSize, width),
     fDerivatives(batchSize, width),
     fWeightGradients(width, inputWidth),
     fBiasGradients(width, 1),
     fActivationGradients(batchSize, width),
     fF(f)
{
   // Everything is handled by the member initializers.
}


//______________________________________________________________________________

/// Copy constructor.
///
/// Takes over the dimensions, dropout probability and activation function
/// of \p layer and allocates fresh matrices of matching size. Only the
/// weights and biases are copied; the output, derivative and gradient
/// matrices are merely allocated.
template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(const TLayer &layer)
   : fBatchSize(layer.fBatchSize),
     fInputWidth(layer.fInputWidth),
     fWidth(layer.fWidth),
     fDropoutProbability(layer.fDropoutProbability),
     fWeights(layer.fWidth, layer.fInputWidth),
     fBiases(layer.fWidth, 1),
     fOutput(layer.fBatchSize, layer.fWidth),
     fDerivatives(layer.fBatchSize, layer.fWidth),
     fWeightGradients(layer.fWidth, layer.fInputWidth),
     fBiasGradients(layer.fWidth, 1),
     fActivationGradients(layer.fBatchSize, layer.fWidth),
     fF(layer.fF)
{
   // Transfer the trainable parameters of the source layer.
   const Matrix_t &sourceWeights = layer.GetWeights();
   Architecture_t::Copy(fWeights, sourceWeights);

   const Matrix_t &sourceBiases = layer.GetBiases();
   Architecture_t::Copy(fBiases, sourceBiases);
}


//______________________________________________________________________________

/// Initialize the trainable parameters of the layer.
///
/// The weights are initialized with method \p m; the biases are always
/// initialized with EInitialization::kZero.
template<typename Architecture_t>
void TLayer<Architecture_t>::Initialize(EInitialization m)
{
   initialize<Architecture_t>(fWeights, m);

   const EInitialization biasMethod = EInitialization::kZero;
   initialize<Architecture_t>(fBiases, biasMethod);
}


//______________________________________________________________________________

/// Forward-propagate \p input through the layer.
///
/// \param input        Input matrix; modified in place when dropout is applied.
/// \param applyDropout If true and the dropout probability is not 1, dropout
///                     is applied to \p input before the layer is evaluated.
template<typename Architecture_t>
inline void TLayer<Architecture_t>::Forward(Matrix_t & input,
                                            bool applyDropout)
{
   // A probability of exactly 1 means dropout would be a no-op, so skip it.
   const bool dropInputs = applyDropout && (fDropoutProbability != 1.0);
   if (dropInputs) {
      Architecture_t::DropoutForward(input, fDropoutProbability);
   }

   // Linear part: product of the input with the weights, plus the biases.
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);

   // NOTE(review): these tensors presumably alias fOutput / fDerivatives
   // rather than copy them; otherwise the results below would be lost.
   Tensor_t outputTensor(fOutput);
   Tensor_t derivativeTensor(fDerivatives);

   // The derivative has to be taken before the activation function is
   // applied to the output.
   evaluateDerivative<Architecture_t>(derivativeTensor, fF, outputTensor);
   evaluate<Architecture_t>(outputTensor, fF);
}


//______________________________________________________________________________

/// Backward-propagate gradients through the layer.
///
/// \param gradients_backward   Receives the gradients passed on to the previous layer.
/// \param activations_backward Activations of the previous layer.
/// \param r                    Regularization type used for the weight gradients.
/// \param weightDecay          Regularization strength.
template<typename Architecture_t>
void TLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                      const Matrix_t & activations_backward,
                                      ERegularization r,
                                      Scalar_t weightDecay)
{
   // NOTE(review): the tensors presumably alias the wrapped matrices, so
   // that results written through them end up in the matrices -- confirm.
   Tensor_t gradientsBackwardTensor(gradients_backward);
   Tensor_t activationsBackwardTensor(activations_backward);
   Tensor_t activationGradientsTensor(fActivationGradients);
   Tensor_t derivativesTensor(fDerivatives);

   // Combine the stored derivatives with the incoming activation gradients
   // element-wise; this overwrites the derivatives from Forward().
   Architecture_t::Hadamard(derivativesTensor, activationGradientsTensor);

   Architecture_t::Backward(gradientsBackwardTensor,
                            fWeightGradients,
                            fBiasGradients,
                            derivativesTensor,
                            activationGradientsTensor,
                            fWeights,
                            activationsBackwardTensor);

   // Add the contribution of the regularization term to the weight gradients.
   addRegularizationGradients<Architecture_t>(fWeightGradients, fWeights,
                                              weightDecay, r);
}


//______________________________________________________________________________

/// Print the number of rows of the weight matrix (the layer width) and the
/// activation function, cast to int, to standard output.
template<typename Architecture_t>
void TLayer<Architecture_t>::Print() const
{
   const int activationCode = static_cast<int>(fF);
   std::cout << "Width = " << fWeights.GetNrows()
             << ", Activation Function = "
             << activationCode << std::endl;
}


//______________________________________________________________________________

//

//  The Shared Layer Class - Implementation

//______________________________________________________________________________


//______________________________________________________________________________

/// Construct a shared layer on top of an existing TLayer.
///
/// The weights and biases are bound by reference to those of \p layer, so
/// \p layer must stay alive as long as this object is used. The output,
/// derivative and gradient matrices are owned by the new object and sized
/// for \p BatchSize.
template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(size_t BatchSize,
                                           TLayer<Architecture_t> &layer)
   : fBatchSize(BatchSize),
     fInputWidth(layer.GetInputWidth()),
     fWidth(layer.GetWidth()),
     fDropoutProbability(layer.GetDropoutProbability()),
     fWeights(layer.GetWeights()),
     fBiases(layer.GetBiases()),
     fOutput(fBatchSize, fWidth),
     fDerivatives(fBatchSize, fWidth),
     fWeightGradients(fWidth, fInputWidth),
     fBiasGradients(fWidth, 1),
     fActivationGradients(fBatchSize, fWidth),
     fF(layer.GetActivationFunction())
{
   // Everything is handled by the member initializers.
}


//______________________________________________________________________________

/// Copy constructor.
///
/// The copy refers to the same weight and bias matrices as \p layer and
/// allocates its own output, derivative and gradient matrices of matching
/// size; their contents are not copied.
template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(const TSharedLayer &layer)
   : fBatchSize(layer.fBatchSize),
     fInputWidth(layer.GetInputWidth()),
     fWidth(layer.GetWidth()),
     fDropoutProbability(layer.fDropoutProbability),
     fWeights(layer.fWeights),
     fBiases(layer.fBiases),
     fOutput(layer.fBatchSize, fWidth),
     fDerivatives(layer.fBatchSize, fWidth),
     fWeightGradients(fWidth, fInputWidth),
     fBiasGradients(fWidth, 1),
     fActivationGradients(layer.fBatchSize, fWidth),
     fF(layer.fF)
{
   // Everything is handled by the member initializers.
}


//______________________________________________________________________________

/// Forward-propagate \p input through the layer using the shared weights.
///
/// \param input        Input matrix; modified in place when dropout is applied.
/// \param applyDropout If true and the dropout probability is not 1, dropout
///                     is applied to \p input before the layer is evaluated.
template<typename Architecture_t>
inline void TSharedLayer<Architecture_t>::Forward(Matrix_t & input,
                                                  bool applyDropout)
{
   // A probability of exactly 1 means dropout would be a no-op, so skip it.
   const bool dropInputs = applyDropout && (fDropoutProbability != 1.0);
   if (dropInputs) {
      Architecture_t::DropoutForward(input, fDropoutProbability);
   }

   // Linear part: product of the input with the weights, plus the biases.
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);

   // NOTE(review): these tensors presumably alias fOutput / fDerivatives
   // rather than copy them; otherwise the results below would be lost.
   Tensor_t outputTensor(fOutput);
   Tensor_t derivativeTensor(fDerivatives);

   // The derivative has to be taken before the activation function is
   // applied to the output.
   evaluateDerivative<Architecture_t>(derivativeTensor, fF, outputTensor);
   evaluate<Architecture_t>(outputTensor, fF);
}


//______________________________________________________________________________

/// Backward-propagate gradients through the layer using the shared weights.
///
/// Follows the same sequence as TLayer::Backward: the matrices are wrapped
/// in Tensor_t objects, the stored activation-function derivatives are
/// multiplied element-wise with the activation gradients, and only then is
/// the architecture's Backward routine invoked.
///
/// \param gradients_backward   Receives the gradients passed on to the previous layer.
/// \param activations_backward Activations of the previous layer.
/// \param r                    Regularization type used for the weight gradients.
/// \param weightDecay          Regularization strength.
template<typename Architecture_t>
inline void TSharedLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                                   const Matrix_t & activations_backward,
                                                   ERegularization r,
                                                   Scalar_t weightDecay)
{
   // NOTE(review): the tensors presumably alias the wrapped matrices, so
   // that results written through them end up in the matrices -- confirm.
   Tensor_t tGradBw(gradients_backward);
   Tensor_t tActBw(activations_backward);
   Tensor_t tActGrad(fActivationGradients);
   Tensor_t tDeriv(fDerivatives);

   // Element-wise product of the derivatives with the incoming activation
   // gradients; this overwrites the derivatives from Forward().
   Architecture_t::Hadamard(tDeriv, tActGrad);
   Architecture_t::Backward(tGradBw,
                            fWeightGradients,
                            fBiasGradients,
                            tDeriv,
                            tActGrad,
                            fWeights,
                            tActBw);
   // Add the contribution of the regularization term to the weight gradients.
   addRegularizationGradients<Architecture_t>(fWeightGradients,
                                              fWeights,
                                              weightDecay, r);
}


//______________________________________________________________________________

/// Print the number of rows of the shared weight matrix (the layer width)
/// and the activation function, cast to int, to standard output.
template<typename Architecture_t>
void TSharedLayer<Architecture_t>::Print() const
{
   const int activationCode = static_cast<int>(fF);
   std::cout << "Width = " << fWeights.GetNrows()
             << ", Activation Function = "
             << activationCode << std::endl;
}


} // namespace DNN

} // namespace TMVA


#endif

r
ROOT::R::TRInterface & r
Definition: Object.C:4

f
#define f(i)
Definition: RSha256.hxx:104

width
include TDocParser_001 C image html pict1_TDocParser_001 png width
Definition: TDocParser.cxx:121

TMatrix.h

TMVA::DNN::TLayer
Generic layer class.
Definition: Layer.h:53

TMVA::DNN::TLayer::Backward
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
Definition: Layer.h:287

TMVA::DNN::TLayer::GetBiasGradients
const Matrix_t & GetBiasGradients() const
Definition: Layer.h:126

TMVA::DNN::TLayer::SetDropoutProbability
void SetDropoutProbability(Scalar_t p)
Definition: Layer.h:113

TMVA::DNN::TLayer::GetActivationGradients
const Matrix_t & GetActivationGradients() const
Definition: Layer.h:124

TMVA::DNN::TLayer::fF
EActivationFunction fF
Activation function of the layer.
Definition: Layer.h:77

TMVA::DNN::TLayer::GetWeights
Matrix_t & GetWeights()
Definition: Layer.h:119

TMVA::DNN::TLayer::fActivationGradients
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
Definition: Layer.h:75

TMVA::DNN::TLayer::TLayer
TLayer(size_t BatchSize, size_t InputWidth, size_t Width, EActivationFunction f, Scalar_t dropoutProbability)
Definition: Layer.h:227

TMVA::DNN::TLayer::fInputWidth
size_t fInputWidth
Number of neurons of the previous layer.
Definition: Layer.h:64

TMVA::DNN::TLayer::fBiasGradients
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
Definition: Layer.h:74

TMVA::DNN::TLayer::GetBiases
const Matrix_t & GetBiases() const
Definition: Layer.h:122

TMVA::DNN::TLayer::GetOutput
const Matrix_t & GetOutput() const
Definition: Layer.h:118

TMVA::DNN::TLayer::fOutput
Matrix_t fOutput
Activations of this layer.
Definition: Layer.h:71

TMVA::DNN::TLayer::GetActivationFunction
EActivationFunction GetActivationFunction() const
Definition: Layer.h:115

TMVA::DNN::TLayer::GetWeightGradients
const Matrix_t & GetWeightGradients() const
Definition: Layer.h:128

TMVA::DNN::TLayer::GetBatchSize
size_t GetBatchSize() const
Definition: Layer.h:108

TMVA::DNN::TLayer::GetInputWidth
size_t GetInputWidth() const
Definition: Layer.h:109

TMVA::DNN::TLayer::GetBiasGradients
Matrix_t & GetBiasGradients()
Definition: Layer.h:125

TMVA::DNN::TLayer::fDropoutProbability
Scalar_t fDropoutProbability
Probability that an input is active.
Definition: Layer.h:67

TMVA::DNN::TLayer::fBiases
Matrix_t fBiases
The bias values of this layer.
Definition: Layer.h:70

TMVA::DNN::TLayer::GetActivationGradients
Matrix_t & GetActivationGradients()
Definition: Layer.h:123

TMVA::DNN::TLayer::fWidth
size_t fWidth
Number of neurons of this layer.
Definition: Layer.h:65

TMVA::DNN::TLayer::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: Layer.h:57

TMVA::DNN::TLayer::GetOutput
Matrix_t & GetOutput()
Definition: Layer.h:117

TMVA::DNN::TLayer::Scalar_t
typename Architecture_t::Scalar_t Scalar_t
Definition: Layer.h:56

TMVA::DNN::TLayer::GetDropoutProbability
size_t GetDropoutProbability() const
Definition: Layer.h:111

TMVA::DNN::TLayer::Print
void Print() const
Definition: Layer.h:314

TMVA::DNN::TLayer::GetBiases
Matrix_t & GetBiases()
Definition: Layer.h:121

TMVA::DNN::TLayer::Tensor_t
typename Architecture_t::Tensor_t Tensor_t
Definition: Layer.h:58

TMVA::DNN::TLayer::fWeightGradients
Matrix_t fWeightGradients
Gradients w.r.t. the weights of this layer.
Definition: Layer.h:73

TMVA::DNN::TLayer::fBatchSize
size_t fBatchSize
Batch size used for training and evaluation.
Definition: Layer.h:63

TMVA::DNN::TLayer::Initialize
void Initialize(EInitialization m)
Initialize fWeights according to the given initialization method.
Definition: Layer.h:260

TMVA::DNN::TLayer::fWeights
Matrix_t fWeights
The fWeights of this layer.
Definition: Layer.h:69

TMVA::DNN::TLayer::fDerivatives
Matrix_t fDerivatives
First fDerivatives of the activations of this layer.
Definition: Layer.h:72

TMVA::DNN::TLayer::GetWeightGradients
Matrix_t & GetWeightGradients()
Definition: Layer.h:127

TMVA::DNN::TLayer::GetWidth
size_t GetWidth() const
Definition: Layer.h:110

TMVA::DNN::TLayer::GetWeights
const Matrix_t & GetWeights() const
Definition: Layer.h:120

TMVA::DNN::TLayer::Forward
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
Definition: Layer.h:269

TMVA::DNN::TSharedLayer
Layer class with shared weight and bias layers.
Definition: Layer.h:148

TMVA::DNN::TSharedLayer::fBiases
Matrix_t & fBiases
Reference to the bias vectors of this layer.
Definition: Layer.h:166

TMVA::DNN::TSharedLayer::fOutput
Matrix_t fOutput
Activations of this layer.
Definition: Layer.h:167

TMVA::DNN::TSharedLayer::GetBiases
Matrix_t & GetBiases()
Definition: Layer.h:210

TMVA::DNN::TSharedLayer::TSharedLayer
TSharedLayer(size_t fBatchSize, TLayer< Architecture_t > &layer)
Definition: Layer.h:328

TMVA::DNN::TSharedLayer::fWeights
Matrix_t & fWeights
Reference to the weight matrix of this layer.
Definition: Layer.h:165

TMVA::DNN::TSharedLayer::GetActivationGradients
Matrix_t & GetActivationGradients()
Definition: Layer.h:212

TMVA::DNN::TSharedLayer::GetBiasGradients
const Matrix_t & GetBiasGradients() const
Definition: Layer.h:215

TMVA::DNN::TSharedLayer::GetWidth
size_t GetWidth() const
Definition: Layer.h:200

TMVA::DNN::TSharedLayer::fBiasGradients
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
Definition: Layer.h:170

TMVA::DNN::TSharedLayer::GetWeightGradients
Matrix_t & GetWeightGradients()
Definition: Layer.h:216

TMVA::DNN::TSharedLayer::Tensor_t
typename Architecture_t::Tensor_t Tensor_t
Definition: Layer.h:154

TMVA::DNN::TSharedLayer::fDerivatives
Matrix_t fDerivatives
First fDerivatives of the activations of this layer.
Definition: Layer.h:168

TMVA::DNN::TSharedLayer::GetBiases
const Matrix_t & GetBiases() const
Definition: Layer.h:211

TMVA::DNN::TSharedLayer::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: Layer.h:153

TMVA::DNN::TSharedLayer::fInputWidth
size_t fInputWidth
Number of neurons of the previous layer.
Definition: Layer.h:160

TMVA::DNN::TSharedLayer::GetOutput
Matrix_t & GetOutput()
Definition: Layer.h:207

TMVA::DNN::TSharedLayer::fWidth
size_t fWidth
Number of neurons of this layer.
Definition: Layer.h:161

TMVA::DNN::TSharedLayer::GetWeightGradients
const Matrix_t & GetWeightGradients() const
Definition: Layer.h:217

TMVA::DNN::TSharedLayer::fBatchSize
size_t fBatchSize
Batch size used for training and evaluation.
Definition: Layer.h:159

TMVA::DNN::TSharedLayer::fWeightGradients
Matrix_t fWeightGradients
Gradients w.r.t. the weights of this layer.
Definition: Layer.h:169

TMVA::DNN::TSharedLayer::GetActivationFunction
EActivationFunction GetActivationFunction() const
Definition: Layer.h:205

TMVA::DNN::TSharedLayer::fActivationGradients
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
Definition: Layer.h:171

TMVA::DNN::TSharedLayer::GetDropoutProbability
size_t GetDropoutProbability() const
Definition: Layer.h:201

TMVA::DNN::TSharedLayer::GetInputWidth
size_t GetInputWidth() const
Definition: Layer.h:199

TMVA::DNN::TSharedLayer::Print
void Print() const
Definition: Layer.h:393

TMVA::DNN::TSharedLayer::GetBatchSize
size_t GetBatchSize() const
Definition: Layer.h:198

TMVA::DNN::TSharedLayer::Forward
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
Definition: Layer.h:356

TMVA::DNN::TSharedLayer::Scalar_t
typename Architecture_t::Scalar_t Scalar_t
Definition: Layer.h:152

TMVA::DNN::TSharedLayer::fF
EActivationFunction fF
Activation function of the layer.
Definition: Layer.h:173

TMVA::DNN::TSharedLayer::fDropoutProbability
Scalar_t fDropoutProbability
Probability that an input is active.
Definition: Layer.h:163

TMVA::DNN::TSharedLayer::GetWeights
Matrix_t & GetWeights() const
Definition: Layer.h:209

TMVA::DNN::TSharedLayer::GetOutput
const Matrix_t & GetOutput() const
Definition: Layer.h:208

TMVA::DNN::TSharedLayer::GetActivationGradients
const Matrix_t & GetActivationGradients() const
Definition: Layer.h:213

TMVA::DNN::TSharedLayer::GetBiasGradients
Matrix_t & GetBiasGradients()
Definition: Layer.h:214

TMVA::DNN::TSharedLayer::SetDropoutProbability
void SetDropoutProbability(Scalar_t p)
Definition: Layer.h:203

TMVA::DNN::TSharedLayer::Backward
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
Definition: Layer.h:373

ROOT::Math::GSLSimAn::Copy
void Copy(void *source, void *dest)
Definition: GSLSimAnnealing.cxx:149

TMVA::DNN::EInitialization
EInitialization
Definition: Functions.h:70

TMVA::DNN::EInitialization::kZero
@ kZero

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition: NeuralNet.icc:498

TMVA::DNN::ERegularization
ERegularization
Enum representing the regularization type applied for a given layer.
Definition: Functions.h:63

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition: Functions.h:32

TMVA
create variable transformations
Definition: GeneticMinimizer.h:21

m
auto * m
Definition: textangle.C:8

Functions.h