// doc/v622/NeuralNet_8h_source.html

/**

 * @file NeuralNet

 * @author  Peter Speckmayer

 * @version 1.0

 *

 * @section LICENSE

 *

 *

 * @section Neural net implementation

 *

 * An implementation of a neural net for TMVA. This neural net uses multithreading

 *

 */


//////////////////////////////////////////////////////////////////////////

//                                                                      //

// NeuralNet                                                            //

//                                                                      //

// A neural net implementation                                          //

//                                                                      //

//////////////////////////////////////////////////////////////////////////


#ifndef TMVA_NEURAL_NET

#define TMVA_NEURAL_NET

#pragma once


#include <vector>

#include <iostream>

#include <fstream>

#include <algorithm>

#include <iterator>

#include <functional>

#include <tuple>

#include <cmath>

#include <cassert>

#include <random>

#include <thread>

#include <future>

#include <type_traits>


#include "Pattern.h"

#include "Monitoring.h"


#include "TApplication.h"

#include "Timer.h"


#include "TH1F.h"

#include "TH2F.h"


#include <fenv.h> // turn on or off exceptions for NaN and other numeric exceptions


namespace TMVA

{


  class IPythonInteractive;


   namespace DNN

   {


      // Free helper functions: only declared here, their definitions are not part of this section.
      // NOTE(review): judging by the names these draw random numbers (Gaussian, uniform, integer);
      // seeding and whether the bounds are inclusive cannot be told from the declarations - confirm
      // against the definitions.


      /// Takes a mean and a sigma and returns a double (presumably a Gaussian-distributed draw - TODO confirm).
      double gaussDouble (double mean, double sigma);

      /// Takes a lower and an upper value and returns a double (presumably a uniform draw - TODO confirm).
      double uniformDouble (double minValue, double maxValue);

      /// Takes an upper value and returns an int (presumably a random integer bounded by maxValue - TODO confirm).
      int randomInt (int maxValue);


      /*! \brief Incremental accumulator for a (weighted) mean and variance
       *
       *  Samples are fed one at a time (or as an iterator range) and the running mean,
       *  the weighted sum of squared deviations and the sum of weights are updated in place,
       *  so the samples themselves never have to be stored.
       */
      class MeanVariance
      {
      public:
         /// Create an empty accumulator.
         MeanVariance ()
            : m_n (0), m_sumWeights (0), m_mean (0), m_squared (0)
         {
         }

         /// Forget every sample added so far.
         inline void clear ()
         {
            *this = MeanVariance ();
         }

         /*! \brief add one sample
          *
          * \param value the sample value
          * \param weight the weight of the sample (1.0 if omitted)
          */
         template <typename T>
         inline void add (T value, double weight = 1.0)
         {
            // the very first sample only seeds the running quantities
            if (m_n++ == 0)
            {
               m_mean = value;
               m_squared = 0.0;
               m_sumWeights = weight;
               return;
            }

            const double totalWeight = m_sumWeights + weight;
            const double delta = value - m_mean;         // distance to the old mean
            const double shift = delta * weight / totalWeight; // how far the mean moves

            m_mean += shift;
            m_squared += m_sumWeights * shift * delta;
            m_sumWeights = totalWeight;
         }

         /*! \brief add every element of the range [itBegin, itEnd) with unit weight
          */
         template <typename ITERATOR>
         inline void add (ITERATOR itBegin, ITERATOR itEnd)
         {
            while (itBegin != itEnd)
            {
               add (*itBegin);
               ++itBegin;
            }
         }

         /// number of samples added
         inline int count () const { return static_cast<int> (m_n); }

         /// sum of the sample weights (0 while empty)
         inline double weights () const { return m_n == 0 ? 0.0 : m_sumWeights; }

         /// current mean (0 while empty)
         inline double mean () const { return m_n == 0 ? 0.0 : m_mean; }

         /// variance: accumulated squared deviations divided by the sum of weights (0 while empty)
         inline double var () const
         {
            if (m_n == 0 || m_squared <= 0)
               return 0;

            return m_squared / m_sumWeights;
         }

         /// variance scaled by n/(n-1) (unbiased for small sample sizes); equals var() for n <= 1
         inline double var_corr () const
         {
            const double biased = var ();
            if (m_n <= 1)
               return biased;

            return biased * m_n / (m_n - 1);
         }

         /// square root of var_corr()
         inline double stdDev_corr () const { return std::sqrt (var_corr ()); }

         /// square root of var()
         inline double stdDev () const { return std::sqrt (var ()); }

      private:
         size_t m_n;          ///< number of samples added
         double m_sumWeights; ///< sum of the weights of all samples
         double m_mean;       ///< running mean
         double m_squared;    ///< running weighted sum of squared deviations from the mean
      };


      /*! \brief Identifiers of the activation function types
       *
       *  The value of every enumerator is a character literal.
       */
      enum class EnumFunction
      {
         ZERO            = '0',
         LINEAR          = 'L',
         TANH            = 'T',
         RELU            = 'R',
         SYMMRELU        = 'r',
         TANHSHIFT       = 't',
         SIGMOID         = 's',
         SOFTSIGN        = 'S',
         GAUSS           = 'G',
         GAUSSCOMPLEMENT = 'C'
      };


      /*! \brief Identifiers of the regularization modes
       *
       *  The enumerators carry the default consecutive values starting at 0.
       */
      enum class EnumRegularization
      {
         NONE,
         L1,
         L2,
         L1MAX
      };


      /*! \brief Output-value modes, encoded as distinct bits so that they can be combined
       *
       *  Every enumerator occupies its own bit; the operators defined below combine and
       *  mask values of this type.
       */
      enum class ModeOutputValues : int
      {
         DIRECT             = 0x01,
         SIGMOID            = 0x02,
         SOFTMAX            = 0x04,
         BATCHNORMALIZATION = 0x08
      };

      /*! \brief bitwise OR of two ModeOutputValues
       *
       * \return a value with every bit set which is set in lhs or in rhs
       */
      inline ModeOutputValues operator| (ModeOutputValues lhs, ModeOutputValues rhs)
      {
         typedef std::underlying_type<ModeOutputValues>::type underlying_t;
         return static_cast<ModeOutputValues> (static_cast<underlying_t> (lhs) | static_cast<underlying_t> (rhs));
      }

      /*! \brief bitwise OR-assignment
       *
       *  Stores (lhs | rhs) in lhs.
       *
       * \return a reference to lhs, so that the result can be modified further
       *         (as the built-in compound assignment operators allow)
       */
      inline ModeOutputValues& operator|= (ModeOutputValues& lhs, ModeOutputValues rhs)
      {
         typedef std::underlying_type<ModeOutputValues>::type underlying_t;
         lhs = static_cast<ModeOutputValues> (static_cast<underlying_t> (lhs) | static_cast<underlying_t> (rhs));
         return lhs;
      }

      /*! \brief bitwise AND of two ModeOutputValues
       *
       * \return a value with every bit set which is set in both lhs and rhs
       */
      inline ModeOutputValues operator& (ModeOutputValues lhs, ModeOutputValues rhs)
      {
         typedef std::underlying_type<ModeOutputValues>::type underlying_t;
         return static_cast<ModeOutputValues> (static_cast<underlying_t> (lhs) & static_cast<underlying_t> (rhs));
      }

      /*! \brief bitwise AND-assignment
       *
       *  Stores (lhs & rhs) in lhs.
       *
       * \return a reference to lhs, so that the result can be modified further
       *         (as the built-in compound assignment operators allow)
       */
      inline ModeOutputValues& operator&= (ModeOutputValues& lhs, ModeOutputValues rhs)
      {
         typedef std::underlying_type<ModeOutputValues>::type underlying_t;
         lhs = static_cast<ModeOutputValues> (static_cast<underlying_t> (lhs) & static_cast<underlying_t> (rhs));
         return lhs;
      }


      /*! \brief test whether a flag is contained in a combination of flags
       *
       * \param flag the flag (bit pattern) to look for
       * \param value the value to inspect
       * \return true if (value & flag) has at least one bit set
       *
       *  The masked result is compared with a value-initialized T instead of being cast to
       *  int first, so bits beyond the width of int are not lost for wider flag types.
       */
      template <typename T>
         bool isFlagSet (T flag, T value)
         {
            return (value & flag) != T ();
         }


      class Net;


      typedef std::vector<char> DropContainer;


      /*! \brief The Batch class encapsulates one mini-batch

       *

       *  Holds a const_iterator to the beginning and the end of one batch in a vector of Pattern

       */

      class Batch

      {

      public:

         typedef typename std::vector<Pattern>::const_iterator const_iterator;


         Batch (typename std::vector<Pattern>::const_iterator itBegin, typename std::vector<Pattern>::const_iterator itEnd)

            : m_itBegin (itBegin)

            , m_itEnd (itEnd)

         {}


         const_iterator begin () const { return m_itBegin; }

         const_iterator end   () const { return m_itEnd; }


         size_t size () const { return std::distance (begin (), end ()); }


      private:

         const_iterator m_itBegin; ///< iterator denoting the beginning of the batch

         const_iterator m_itEnd;   ///< iterator denoting the end of the batch

      };


      // The function templates below are only declared here; their definitions are not part of
      // this section of the file. The descriptions are derived from names and signatures alone.

      /// Takes a source range, an iterator into the weights and a target range.
      /// NOTE(review): presumably accumulates the weighted source values into the target range - confirm against the definition.
      template <typename ItSource, typename ItWeight, typename ItTarget>

         void applyWeights (ItSource itSourceBegin, ItSource itSourceEnd, ItWeight itWeight, ItTarget itTargetBegin, ItTarget itTargetEnd);


      /// Takes the range of the current layer, an iterator into the weights and the range of the previous layer.
      /// NOTE(review): presumably the counterpart of applyWeights for the backward direction - confirm against the definition.
      template <typename ItSource, typename ItWeight, typename ItPrev>

         void applyWeightsBackwards (ItSource itCurrBegin, ItSource itCurrEnd, ItWeight itWeight, ItPrev itPrevBegin, ItPrev itPrevEnd);


      /// Takes a range of values and a function argument.
      /// NOTE(review): presumably applies the function to every value of the range - confirm against the definition.
      template <typename ItValue, typename ItFunction>

         void applyFunctions (ItValue itValue, ItValue itValueEnd, ItFunction itFunction);


      /// Overload which additionally takes an inverse function and an iterator into gradients.
      /// NOTE(review): presumably also fills the gradients using the inverse function - confirm against the definition.
      template <typename ItValue, typename ItFunction, typename ItInverseFunction, typename ItGradient>

         void applyFunctions (ItValue itValue, ItValue itValueEnd, ItFunction itFunction, ItInverseFunction itInverseFunction, ItGradient itGradient);


      /// Takes a source range, a range of target deltas, an iterator into target gradients and an iterator into gradients.
      /// NOTE(review): presumably computes the weight gradients from these inputs - confirm against the definition.
      template <typename ItSource, typename ItDelta, typename ItTargetGradient, typename ItGradient>

         void update (ItSource itSource, ItSource itSourceEnd,

                      ItDelta itTargetDeltaBegin, ItDelta itTargetDeltaEnd,

                      ItTargetGradient itTargetGradientBegin,

                      ItGradient itGradient);


      /// Overload selected by a compile-time EnumRegularization; additionally takes an iterator into the weights
      /// and a weight-decay value.
      /// NOTE(review): presumably adds a regularization term to the gradients - confirm against the definition.
      template <EnumRegularization Regularization, typename ItSource, typename ItDelta, typename ItTargetGradient, typename ItGradient, typename ItWeight>

         void update (ItSource itSource, ItSource itSourceEnd,

                      ItDelta itTargetDeltaBegin, ItDelta itTargetDeltaEnd,

                      ItTargetGradient itTargetGradientBegin,

                      ItGradient itGradient,

                      ItWeight itWeight, double weightDecay);


      // ----- signature of a minimizer -------------

      // class Minimizer

      // {

      // public:


      //     template <typename Function, typename Variables, typename PassThrough>

      //     double operator() (Function& fnc, Variables& vars, PassThrough& passThrough)

      //     {

      //         // auto itVars = begin (vars);

      //         // auto itVarsEnd = end (vars);


      //         std::vector<double> myweights;

      //         std::vector<double> gradients;


      //         double value = fnc (passThrough, myweights);

      //         value = fnc (passThrough, myweights, gradients);

      //         return value;

      //     }

      // };


      /// Lists all the minimizer types.
      enum MinimizerType
      {
         fSteepest ///< SGD
      };


      /*! \brief Steepest Gradient Descent algorithm (SGD)
       *
       *  Bundles the parameters and the reusable buffers of a steepest gradient descent
       *  minimizer. The minimization itself is done by operator(), which is only declared
       *  in this class.
       */
      class Steepest
      {
      public:
         /*! \brief c'tor
          *
          * \param learningRate the learning rate of the SGD algorithm (stored in m_alpha)
          * \param momentum fraction of the velocity which is taken over from the last step (stored in m_beta)
          * \param repetitions re-compute the gradients each "repetitions" steps (stored in m_repetitions)
          */
         Steepest (double learningRate = 1e-4,
                   double momentum = 0.5,
                   size_t repetitions = 10)
            : m_repetitions (repetitions),
              m_alpha (learningRate),
              m_beta (momentum)
         {
         }

         /*! \brief entry point which starts the minimization procedure
          *
          * \param fitnessFunction (templated) the function which is to be minimized
          * \param weights (templated) reference to a container of weights; the result of the
          *                minimization is returned via this reference (the container needs to
          *                support std::begin and std::end)
          * \param passThrough (templated) object holding whatever data the fitness function
          *                    needs; it is not touched by the minimizer and is handed to the
          *                    fitness function when that is called
          */
         template <typename Function, typename Weights, typename PassThrough>
         double operator() (Function& fitnessFunction, Weights& weights, PassThrough& passThrough);

         size_t m_repetitions; ///< value of the "repetitions" c'tor argument

         double m_alpha; ///< internal parameter (learningRate)
         double m_beta;  ///< internal parameter (momentum)

         std::vector<double> m_prevGradients; ///< remembers the gradients of the previous step

         std::vector<double> m_localWeights;   ///< local weights for reuse in thread
         std::vector<double> m_localGradients; ///< local gradients for reuse in thread
      };


      // The function templates below are only declared here; their definitions are not part of
      // this section of the file. The descriptions are derived from names and signatures alone.

      /// Takes an output range, a truth range, a delta range, an inverse activation function argument and a
      /// pattern weight; returns a double.
      /// NOTE(review): presumably the sum-of-squares error, with the deltas filled as a side effect - confirm against the definition.
      template <typename ItOutput, typename ItTruth, typename ItDelta, typename ItInvActFnc>

         double sumOfSquares (ItOutput itOutputBegin, ItOutput itOutputEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight);


      /// Same parameter layout as sumOfSquares, with a probability range as first argument pair.
      /// NOTE(review): presumably the cross-entropy error - confirm against the definition.
      template <typename ItProbability, typename ItTruth, typename ItDelta, typename ItInvActFnc>

         double crossEntropy (ItProbability itProbabilityBegin, ItProbability itProbabilityEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight);


      /// Same parameter layout as crossEntropy.
      /// NOTE(review): presumably the cross-entropy error after a soft-max transformation - confirm against the definition.
      template <typename ItOutput, typename ItTruth, typename ItDelta, typename ItInvActFnc>

         double softMaxCrossEntropy (ItOutput itProbabilityBegin, ItOutput itProbabilityEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight);


      /// Takes an error value, a range of weights, a weight-decay factor and the regularization mode; returns a double.
      /// NOTE(review): presumably the error with the regularization term added - confirm against the definition.
      template <typename ItWeight>

         double weightDecay (double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization);


      /*! \brief LayerData holds the data of one layer
       *
       *  LayerData holds the data of one layer (node values, deltas, value gradients), but not
       *  its layout. Weights, gradients, drop-out flags and the input values of an input layer
       *  are not stored in this class; only iterators to them are kept.
       */
      class LayerData
      {
      public:
         typedef std::vector<double> container_type;

         typedef container_type::iterator iterator_type;
         typedef container_type::const_iterator const_iterator_type;

         typedef std::vector<std::function<double(double)> > function_container_type;
         typedef function_container_type::iterator function_iterator_type;
         typedef function_container_type::const_iterator const_function_iterator_type;

         typedef DropContainer::const_iterator const_dropout_iterator;

         /*! \brief c'tor of LayerData
          *
          *  C'tor of LayerData for the input layer
          *
          * \param itInputBegin iterator to the begin of a vector which holds the values of the nodes of the neural net
          * \param itInputEnd iterator to the end of a vector which holds the values of the nodes of the neural net
          * \param eModeOutput indicates a potential transformation of the output values before further computation
          *                    DIRECT does no further transformation; SIGMOID applies a sigmoid transformation to each
          *                    output value (to create a probability); SOFTMAX applies a softmax transformation to all
          *                    output values (mutually exclusive probability)
          */
         LayerData (const_iterator_type itInputBegin, const_iterator_type itInputEnd, ModeOutputValues eModeOutput = ModeOutputValues::DIRECT);

         /*! \brief c'tor of LayerData
          *
          *  C'tor of LayerData for the input layer
          *
          * \param inputSize input size of this layer
          */
         LayerData  (size_t inputSize);

         /// d'tor
         ~LayerData ()    {}

         /*! \brief c'tor of LayerData
          *
          *  C'tor of LayerData for all layers which are not the input layer; Used during the training of the DNN
          *
          * \param size size of the layer
          * \param itWeightBegin indicates the start of the weights for this layer on the weight vector
          * \param itGradientBegin indicates the start of the gradients for this layer on the gradient vector
          * \param activationFunction shared pointer to the activation function of this layer
          * \param inverseActivationFunction shared pointer to the inverse activation function of this layer
          * \param eModeOutput indicates a potential transformation of the output values before further computation
          *                    DIRECT does no further transformation; SIGMOID applies a sigmoid transformation to each
          *                    output value (to create a probability); SOFTMAX applies a softmax transformation to all
          *                    output values (mutually exclusive probability)
          */
         LayerData (size_t size,
                    const_iterator_type itWeightBegin,
                    iterator_type itGradientBegin,
                    std::shared_ptr<std::function<double(double)>> activationFunction,
                    std::shared_ptr<std::function<double(double)>> inverseActivationFunction,
                    ModeOutputValues eModeOutput = ModeOutputValues::DIRECT);

         /*! \brief c'tor of LayerData
          *
          *  C'tor of LayerData for all layers which are not the input layer; Used during the application of the DNN
          *
          * \param size size of the layer
          * \param itWeightBegin indicates the start of the weights for this layer on the weight vector
          * \param activationFunction shared pointer to the activation function of this layer
          * \param eModeOutput indicates a potential transformation of the output values before further computation
          *                    DIRECT does no further transformation; SIGMOID applies a sigmoid transformation to each
          *                    output value (to create a probability); SOFTMAX applies a softmax transformation to all
          *                    output values (mutually exclusive probability)
          */
         LayerData (size_t size, const_iterator_type itWeightBegin,
                    std::shared_ptr<std::function<double(double)>> activationFunction,
                    ModeOutputValues eModeOutput = ModeOutputValues::DIRECT);

         /*! \brief copy c'tor of LayerData
          *
          *  Copies every member of "other" (member-wise).
          */
         LayerData (const LayerData& other)
            : m_size (other.m_size)
            , m_itInputBegin (other.m_itInputBegin)
            , m_itInputEnd (other.m_itInputEnd)
            , m_deltas (other.m_deltas)
            , m_valueGradients (other.m_valueGradients)
            , m_values (other.m_values)
            , m_itDropOut (other.m_itDropOut)
            , m_hasDropOut (other.m_hasDropOut)
            , m_itConstWeightBegin   (other.m_itConstWeightBegin)
            , m_itGradientBegin (other.m_itGradientBegin)
            , m_activationFunction (other.m_activationFunction)
            , m_inverseActivationFunction (other.m_inverseActivationFunction)
            , m_isInputLayer (other.m_isInputLayer)
            , m_hasWeights (other.m_hasWeights)
            , m_hasGradients (other.m_hasGradients)
            , m_eModeOutput (other.m_eModeOutput)
         {}

         /*! \brief move c'tor of LayerData
          *
          *  Moves the vectors and the function pointers out of "other"; sizes, iterators,
          *  flags and the output mode are copied.
          *
          *  Declared noexcept: standard containers such as std::vector only move their
          *  elements when relocating storage if the move c'tor cannot throw, and fall back
          *  to the copy c'tor otherwise.
          */
         LayerData (LayerData&& other) noexcept
            : m_size (other.m_size)
            , m_itInputBegin (other.m_itInputBegin)
            , m_itInputEnd (other.m_itInputEnd)
            , m_deltas (std::move(other.m_deltas))
            , m_valueGradients (std::move(other.m_valueGradients))
            , m_values (std::move(other.m_values))
            , m_itDropOut (other.m_itDropOut)
            , m_hasDropOut (other.m_hasDropOut)
            , m_itConstWeightBegin   (other.m_itConstWeightBegin)
            , m_itGradientBegin (other.m_itGradientBegin)
            , m_activationFunction (std::move(other.m_activationFunction))
            , m_inverseActivationFunction (std::move(other.m_inverseActivationFunction))
            , m_isInputLayer (other.m_isInputLayer)
            , m_hasWeights (other.m_hasWeights)
            , m_hasGradients (other.m_hasGradients)
            , m_eModeOutput (other.m_eModeOutput)
         {}

         /*! \brief change the input iterators
          *
          *  Also marks this layer as an input layer.
          *
          * \param itInputBegin indicates the start of the input node vector
          * \param itInputEnd indicates the end of the input node vector
          */
         void setInput (const_iterator_type itInputBegin, const_iterator_type itInputEnd)
         {
            m_isInputLayer = true;
            m_itInputBegin = itInputBegin;
            m_itInputEnd = itInputEnd;
         }

         /*! \brief clear the values and the deltas
          *
          *  Sets every value and every delta to 0.0; the sizes of both vectors are kept.
          */
         void clear ()
         {
            m_values.assign (m_values.size (), 0.0);
            m_deltas.assign (m_deltas.size (), 0.0);
         }

         const_iterator_type valuesBegin () const { return m_isInputLayer ? m_itInputBegin : begin (m_values); } ///< returns const iterator to the begin of the (node) values
         const_iterator_type valuesEnd   () const { return m_isInputLayer ? m_itInputEnd   : end (m_values); } ///< returns const iterator to the end of the (node) values

         iterator_type valuesBegin () { assert (!m_isInputLayer); return begin (m_values); }  ///< returns iterator to the begin of the (node) values; must not be called on an input layer
         iterator_type valuesEnd   () { assert (!m_isInputLayer); return end (m_values); } ///< returns iterator to the end of the (node) values; must not be called on an input layer

         ModeOutputValues outputMode () const { return m_eModeOutput; } ///< returns the output mode
         container_type probabilities () const { return computeProbabilities (); } ///< computes the probabilities from the current node values and returns them

         iterator_type deltasBegin () { return begin (m_deltas); } ///< returns iterator to the begin of the deltas (back-propagation)
         iterator_type deltasEnd   () { return end   (m_deltas); } ///< returns iterator to the end of the deltas (back-propagation)

         const_iterator_type deltasBegin () const { return begin (m_deltas); } ///< returns const iterator to the begin of the deltas (back-propagation)
         const_iterator_type deltasEnd   () const { return end   (m_deltas); } ///< returns const iterator to the end of the deltas (back-propagation)

         iterator_type valueGradientsBegin () { return begin (m_valueGradients); } ///< returns iterator to the begin of the gradients of the node values
         iterator_type valueGradientsEnd   () { return end   (m_valueGradients); } ///< returns iterator to the end of the gradients of the node values

         const_iterator_type valueGradientsBegin () const { return begin (m_valueGradients); } ///< returns const iterator to the begin of the gradients of the node values
         const_iterator_type valueGradientsEnd   () const { return end   (m_valueGradients); } ///< returns const iterator to the end of the gradients of the node values

         iterator_type gradientsBegin () { assert (m_hasGradients); return m_itGradientBegin; } ///< returns iterator to the begin of the gradients; requires that the layer has gradients
         const_iterator_type gradientsBegin () const { assert (m_hasGradients); return m_itGradientBegin; } ///< returns const iterator to the begin of the gradients; requires that the layer has gradients
         const_iterator_type weightsBegin   () const { assert (m_hasWeights); return m_itConstWeightBegin; } ///< returns const iterator to the begin of the weights for this layer; requires that the layer has weights

         std::shared_ptr<std::function<double(double)>> activationFunction () const { return m_activationFunction; } ///< returns the (shared) activation function of this layer
         std::shared_ptr<std::function<double(double)>> inverseActivationFunction () const { return m_inverseActivationFunction; } ///< returns the (shared) inverse activation function of this layer

         /*! \brief set the drop-out info for this layer
          *
          *  Stores the iterator and turns drop-out on for this layer.
          *
          * \param itDrop iterator to the drop-out information
          */
         template <typename Iterator>
            void setDropOut (Iterator itDrop) { m_itDropOut = itDrop; m_hasDropOut = true; }

         /*! \brief clear the drop-out-data for this layer
          *
          *  Turns drop-out off; the stored iterator is left untouched.
          */
         void clearDropOut () { m_hasDropOut = false; }

         bool hasDropOut () const { return m_hasDropOut; } ///< has this layer drop-out turned on?
         const_dropout_iterator dropOut () const { assert (m_hasDropOut); return m_itDropOut; } ///< return the begin of the drop-out information; requires that drop-out is turned on

         size_t size () const { return m_size; } ///< return the size of the layer

      private:

         /*! \brief compute the probabilities from the node values
          *
          *  Only declared here; the definition is not part of this class body.
          */
         container_type computeProbabilities () const;

      private:

         size_t m_size; ///< layer size

         const_iterator_type m_itInputBegin; ///< iterator to the first of the nodes in the input node vector
         const_iterator_type m_itInputEnd;   ///< iterator to the end of the nodes in the input node vector

         std::vector<double> m_deltas; ///< stores the deltas for the DNN training
         std::vector<double> m_valueGradients; ///< stores the gradients of the values (nodes)
         std::vector<double> m_values; ///< stores the values of the nodes in this layer
         const_dropout_iterator m_itDropOut; ///< iterator to a container indicating if the corresponding node is to be dropped
         bool m_hasDropOut; ///< dropOut is turned on?

         const_iterator_type m_itConstWeightBegin; ///< const iterator to the first weight of this layer in the weight vector
         iterator_type       m_itGradientBegin;  ///< iterator to the first gradient of this layer in the gradient vector

         std::shared_ptr<std::function<double(double)>> m_activationFunction; ///< activation function for this layer
         std::shared_ptr<std::function<double(double)>> m_inverseActivationFunction; ///< inverse activation function for this layer

         bool m_isInputLayer; ///< is this layer an input layer
         bool m_hasWeights;  ///< does this layer have weights (it does not if it is the input layer)
         bool m_hasGradients; ///< does this layer have gradients (only if in training mode)

         ModeOutputValues m_eModeOutput; ///< stores the output mode (DIRECT, SIGMOID, SOFTMAX)

      };


      /*! \brief Layout description of one layer of the DNN
       *
       *  A Layer stores the number of nodes, the activation function (with its inverse and
       *  its type) and the output-value mode of a layer. The layer data itself is not held
       *  by objects of this class (see class "LayerData").
       */
      class Layer
      {
      public:
         /*! \brief c'tor for defining a Layer
          *
          * \param numNodes number of nodes of the layer
          * \param activationFunction type of the activation function of the layer
          * \param eModeOutputValues how the output values of the layer are to be transformed (DIRECT if omitted)
          */
         Layer (size_t numNodes, EnumFunction activationFunction, ModeOutputValues eModeOutputValues = ModeOutputValues::DIRECT);

         /// get the mode-output-value (direct, probabilities)
         ModeOutputValues modeOutputValues () const
         {
            return m_eModeOutputValues;
         }

         /// set the mode-output-value
         void modeOutputValues (ModeOutputValues eModeOutputValues)
         {
            m_eModeOutputValues = eModeOutputValues;
         }

         /// number of nodes of this layer
         size_t numNodes () const
         {
            return m_numNodes;
         }

         /// number of weights of this layer for the given number of input nodes (fully connected)
         size_t numWeights (size_t numInputNodes) const
         {
            return numInputNodes * numNodes ();
         }

         /// fetch the activation function for this layer
         std::shared_ptr<std::function<double(double)>> activationFunction () const
         {
            return m_activationFunction;
         }

         /// fetch the inverse activation function for this layer
         std::shared_ptr<std::function<double(double)>> inverseActivationFunction () const
         {
            return m_inverseActivationFunction;
         }

         /// get the activation function type for this layer
         EnumFunction activationFunctionType () const
         {
            return m_activationFunctionType;
         }

      private:
         std::shared_ptr<std::function<double(double)>> m_activationFunction;        ///< the activation function
         std::shared_ptr<std::function<double(double)>> m_inverseActivationFunction; ///< the inverse activation function

         size_t m_numNodes; ///< number of nodes of this layer

         ModeOutputValues m_eModeOutputValues; ///< are the output values of this layer to be transformed (e.g. to probabilities) or returned as such
         EnumFunction m_activationFunctionType; ///< type of the activation function

         friend class Net;
      };


      // The function templates below are only declared here; their definitions are not part of
      // this section of the file. The descriptions are derived from names and signatures alone.

      /// Takes the (read-only) data of the previous layer and the (writable) data of the current layer.
      /// NOTE(review): presumably the forward propagation step from the previous into the current layer - confirm against the definition.
      template <typename LAYERDATA>

         void forward (const LAYERDATA& prevLayerData, LAYERDATA& currLayerData);


      /// Takes the data of the previous and of the current layer, both writable.
      /// NOTE(review): presumably the back-propagation step from the current into the previous layer - confirm against the definition.
      template <typename LAYERDATA>

         void backward (LAYERDATA& prevLayerData, LAYERDATA& currLayerData);


      /// Takes the (read-only) data of the previous layer, the (writable) data of the current layer, a weight-decay
      /// value and the regularization mode.
      /// NOTE(review): presumably updates the gradients of the current layer - confirm against the definition.
      template <typename LAYERDATA>

         void update (const LAYERDATA& prevLayerData, LAYERDATA& currLayerData, double weightDecay, EnumRegularization regularization);


      /*! \brief Settings for the training of the neural net

       *

       *

       */

      class Settings

      {

      public:


         /*! \brief c'tor

          *

          *

          */

         Settings (TString name,

                   size_t _convergenceSteps = 15, size_t _batchSize = 10, size_t _testRepetitions = 7,

                   double _factorWeightDecay = 1e-5, TMVA::DNN::EnumRegularization _regularization = TMVA::DNN::EnumRegularization::NONE,

                   MinimizerType _eMinimizerType = MinimizerType::fSteepest,

                   double _learningRate = 1e-5, double _momentum = 0.3,

                   int _repetitions = 3,

                   bool _multithreading = true);


         /*! \brief d'tor

          *

          *

          */

         virtual ~Settings ();


         /*! \brief set the drop-out configuration (layer-wise)

          *

          * \param begin begin of an array or vector denoting the drop-out probabilities for each layer

          * \param end end of an array or vector denoting the drop-out probabilities for each layer

          * \param _dropRepetitions denotes after how many repetitions the drop-out setting (which nodes are dropped out exactly) is changed

          */

         template <typename Iterator>

            void setDropOut (Iterator begin, Iterator end, size_t _dropRepetitions) { m_dropOut.assign (begin, end); m_dropRepetitions = _dropRepetitions; }


         size_t dropRepetitions () const { return m_dropRepetitions; }

         const std::vector<double>& dropFractions () const { return m_dropOut; }


         void setMonitoring (std::shared_ptr<Monitoring> ptrMonitoring) { fMonitoring = ptrMonitoring; } ///< prepared for monitoring


         size_t convergenceSteps () const { return m_convergenceSteps; } ///< how many steps until training is deemed to have converged

         size_t batchSize () const { return m_batchSize; } ///< mini-batch size

         size_t testRepetitions () const { return m_testRepetitions; } ///< how often is the test data tested

         double factorWeightDecay () const { return m_factorWeightDecay; } ///< get the weight-decay factor


         double learningRate () const { return fLearningRate; } ///< get the learning rate

         double momentum () const { return fMomentum; } ///< get the momentum (e.g. for SGD)

         int repetitions () const { return fRepetitions; } ///< how many steps have to be gone until the batch is changed

         MinimizerType minimizerType () const { return fMinimizerType; } ///< which minimizer shall be used (e.g. SGD)


         virtual void testSample (double /*error*/, double /*output*/, double /*target*/, double /*weight*/) {} ///< virtual function to be used for monitoring (callback)

         virtual void startTrainCycle () ///< callback for monitoring and logging

         {

            m_convergenceCount = 0;

            m_maxConvergenceCount= 0;

            m_minError = 1e10;

         }

         virtual void endTrainCycle (double /*error*/) {} ///< callback for monitoring and logging


         virtual void setProgressLimits (double minProgress = 0, double maxProgress = 100) ///< for monitoring and logging (set the current "progress" limits for the display of the progress)

         {

            m_minProgress = minProgress;

            m_maxProgress = maxProgress;

         }

         virtual void startTraining () ///< start drawing the progress bar

         {

            m_timer.DrawProgressBar (Int_t(m_minProgress));

         }

         virtual void cycle (double progress, TString text) ///< advance on the progress bar

         {

            m_timer.DrawProgressBar (Int_t(m_minProgress+(m_maxProgress-m_minProgress)*(progress/100.0)), text);

         }


         /// \brief callback for monitoring and logging (does nothing in this base implementation)
         virtual void startTestCycle ()
         {
         }

         /// \brief callback for monitoring and logging (does nothing in this base implementation)
         virtual void endTestCycle ()
         {
         }

         /// \brief callback for monitoring and logging (does nothing in this base implementation)
         virtual void testIteration ()
         {
         }

         /// \brief callback for monitoring and logging
         ///
         /// This base implementation ignores input, output, target and pattern weight
         /// and does nothing.
         virtual void drawSample (const std::vector<double>& /*input*/,
                                  const std::vector<double>& /* output */,
                                  const std::vector<double>& /* target */,
                                  double /* patternWeight */)
         {
         }


         /// \brief callback for monitoring and logging
         ///
         /// This base implementation ignores the net and the weights and does nothing.
         virtual void computeResult (const Net& /* net */,
                                     std::vector<double>& /* weights */)
         {
         }


         /// \brief has this training converged already?
         ///
         /// Only the declaration is visible here; the function is virtual and defined elsewhere.
         /// \param testError error value the decision is based on
         ///                  (NOTE(review): presumably the error of the latest test cycle; confirm against the definition)
         /// \return true if the training is regarded as converged
         virtual bool hasConverged (double testError);


         /// \brief which regularization (if any) of the DNN is turned on
         EnumRegularization regularization () const
         {
            return m_regularization;
         }


         /// \brief is multithreading turned on?
         bool useMultithreading () const
         {
            return m_useMultithreading;
         }


         /// \brief preparation for monitoring
         ///
         /// Forwards to the monitoring object; does nothing when no monitoring is set.
         void pads (int numPads)
         {
            if (!fMonitoring)
               return;
            fMonitoring->pads (numPads);
         }

         /// \brief for monitoring: forwards a histogram request (name, bins, min, max) to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void create (std::string histoName, int bins, double min, double max)
         {
            if (!fMonitoring)
               return;
            fMonitoring->create (histoName, bins, min, max);
         }

         /// \brief for monitoring: forwards a histogram request with a second set of bins/min/max to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void create (std::string histoName, int bins, double min, double max, int bins2, double min2, double max2)
         {
            if (!fMonitoring)
               return;
            fMonitoring->create (histoName, bins, min, max, bins2, min2, max2);
         }

         /// \brief for monitoring: forwards the value x for the named histogram to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void addPoint (std::string histoName, double x)
         {
            if (!fMonitoring)
               return;
            fMonitoring->addPoint (histoName, x);
         }

         /// \brief for monitoring: forwards the point (x, y) for the named histogram to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void addPoint (std::string histoName, double x, double y)
         {
            if (!fMonitoring)
               return;
            fMonitoring->addPoint (histoName, x, y);
         }

         /// \brief for monitoring: forwards a plot request (histogram name, options, pad, color) to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void plot (std::string histoName, std::string options, int pad, EColor color)
         {
            if (!fMonitoring)
               return;
            fMonitoring->plot (histoName, options, pad, color);
         }

         /// \brief for monitoring: forwards a clear request for the named histogram to the monitoring object
         ///
         /// Does nothing when no monitoring is set.
         void clear (std::string histoName)
         {
            if (!fMonitoring)
               return;
            fMonitoring->clear (histoName);
         }

         /// \brief for monitoring: asks the monitoring object whether the named histogram exists
         ///
         /// \return false when no monitoring is set, otherwise the answer of the monitoring object
         bool exists (std::string histoName)
         {
            if (!fMonitoring)
               return false;
            return fMonitoring->exists (histoName);
         }


         /// \brief returns the current convergence count
         size_t convergenceCount () const
         {
            return m_convergenceCount;
         }

         /// \brief returns the max convergence count so far
         size_t maxConvergenceCount () const
         {
            return m_maxConvergenceCount;
         }

         size_t minError () const { return m_minError; } ///< returns the smallest error so far


      public:

         Timer  m_timer; ///< timer for monitoring; draws the progress bar (see startTraining and cycle)

         double m_minProgress; ///< lower limit of the progress bar range (set by setProgressLimits)

         double m_maxProgress; ///< upper limit of the progress bar range (set by setProgressLimits)


         size_t m_convergenceSteps; ///< number of steps without improvement to consider the DNN to have converged

         size_t m_batchSize; ///< mini-batch size

         size_t m_testRepetitions; ///< how often the test data is tested (returned by testRepetitions())

         double m_factorWeightDecay; ///< weight-decay factor (returned by factorWeightDecay())


         // NOTE(review): the four counters below are not used in this part of the header;
         // presumably they count evaluations of E/dE (per mini-batch for the "mb" variants) -- confirm.
         size_t count_E;

         size_t count_dE;

         size_t count_mb_E;

         size_t count_mb_dE;


         EnumRegularization m_regularization; ///< regularization mode (returned by regularization())


         double m_dropRepetitions; ///< NOTE(review): presumably the repetition count of a drop-out configuration -- confirm

         std::vector<double> m_dropOut; ///< NOTE(review): presumably the drop-out fractions -- confirm


         double fLearningRate; ///< learning rate (returned by learningRate())

         double fMomentum; ///< momentum, e.g. for SGD (returned by momentum())

         int fRepetitions; ///< how many steps have to be gone until the batch is changed (returned by repetitions())

         MinimizerType fMinimizerType; ///< which minimizer shall be used (returned by minimizerType())


         size_t m_convergenceCount; ///< current convergence count; reset to 0 by startTrainCycle()

         size_t m_maxConvergenceCount; ///< max convergence count so far; reset to 0 by startTrainCycle()

         double m_minError; ///< smallest error so far; reset to 1e10 by startTrainCycle()


      protected:

         bool m_useMultithreading; ///< is multithreading turned on? (returned by useMultithreading())


         std::shared_ptr<Monitoring> fMonitoring; ///< monitoring object; may be empty, the forwarding helpers (pads, create, addPoint, ...) check it before use

      };


      /*! \brief Settings for classification

       *

       * contains additional settings if the DNN problem is classification

       */

      class ClassificationSettings : public Settings

      {

      public:

         /*! \brief c'tor

          *

          *

          */

         ClassificationSettings (TString name,

                                 size_t _convergenceSteps = 15, size_t _batchSize = 10, size_t _testRepetitions = 7,

                                 double _factorWeightDecay = 1e-5, EnumRegularization _regularization = EnumRegularization::NONE,

                                 size_t _scaleToNumEvents = 0, MinimizerType _eMinimizerType = MinimizerType::fSteepest,

                                 double _learningRate = 1e-5, double _momentum = 0.3, int _repetitions = 3,

                                 bool _useMultithreading = true)

            : Settings (name, _convergenceSteps, _batchSize, _testRepetitions, _factorWeightDecay,

                        _regularization, _eMinimizerType, _learningRate, _momentum, _repetitions, _useMultithreading)

            , m_ams ()

            , m_sumOfSigWeights (0)

            , m_sumOfBkgWeights (0)

            , m_scaleToNumEvents (_scaleToNumEvents)

            , m_cutValue (10.0)

            , m_pResultPatternContainer (NULL)

            , m_fileNameResult ()

            , m_fileNameNetConfig ()

            {

            }


         /*! \brief d'tor

          *

          *

          */

         virtual ~ClassificationSettings ()

            {

            }


         void startTrainCycle ();

         void endTrainCycle (double /*error*/);

         void testIteration () { if (fMonitoring) fMonitoring->ProcessEvents (); }


         /* void createHistograms () */

         /* { */

         /*     std::cout << "is hist ROC existing?" << std::endl; */

         /*     if (m_histROC) */

         /*     { */

         /*         std::cout << "--> yes" << std::endl; */

         /*         fMonitoring->ProcessEvents (); */

         /*         return; */

         /*     } */


         /*     std::cout << "create histograms" << std::endl; */

         /*     TCanvas* canvas = fMonitoring->GetCanvas (); */

         /*     if (canvas) */

         /*     { */

         /*         std::cout << "canvas divide" << std::endl; */

         /*         canvas->cd (); */

         /*         canvas->Divide (2,2); */

         /*     } */

         /*     if (!m_histROC)  */

         /*     {  */

         /*         m_histROC = new TH2F ("ROC","ROC", 1000, 0, 1.0, 1000, 0, 1.0); m_histROC->SetDirectory (0);  */

         /*         m_histROC->SetLineColor (kBlue); */

         /*     } */

         /*     if (!m_histSignificance)  */

         /*     {  */

         /*         m_histSignificance = new TH2F ("Significance", "Significance", 1000, 0,1.0, 5, 0.0, 2.0);  */

         /*         m_histSignificance->SetDirectory (0);  */

         /*         m_histSignificance->SetBit (TH1::kCanRebin);  */

         /*         m_histROC->SetLineColor (kRed); */

         /*     } */

         /*     if (!m_histError)  */

         /*     {  */

         /*         m_histError = new TH1F ("Error", "Error", 100, 0, 100);  */

         /*         m_histError->SetDirectory (0);  */

         /*         m_histError->SetBit (TH1::kCanRebin); */

         /*         m_histROC->SetLineColor (kGreen); */

         /*     } */

         /*     if (!m_histOutputSignal)  */

         /*     {  */

         /*         m_histOutputSignal = new TH1F ("Signal", "Signal", 100, 0, 1.0);   */

         /*         m_histOutputSignal->SetDirectory (0);  */

         /*         m_histOutputSignal->SetBit (TH1::kCanRebin); */

         /*     } */

         /*     if (!m_histOutputBackground)  */

         /*     {  */

         /*         m_histOutputBackground = new TH1F ("Background", "Background", 100, 0, 1.0);  */

         /*         m_histOutputBackground->SetDirectory (0);  */

         /*         m_histOutputBackground->SetBit (TH1::kCanRebin); */

         /*     } */


         /*     fMonitoring->ProcessEvents (); */

         /* } */


         void testSample (double error, double output, double target, double weight);


         virtual void startTestCycle ();

         virtual void endTestCycle ();


         void setWeightSums (double sumOfSigWeights, double sumOfBkgWeights);

         void setResultComputation (std::string _fileNameNetConfig, std::string _fileNameResult, std::vector<Pattern>* _resultPatternContainer);


         std::vector<double> m_input;

         std::vector<double> m_output;

         std::vector<double> m_targets;

         std::vector<double> m_weights;


         std::vector<double> m_ams;

         std::vector<double> m_significances;


         double m_sumOfSigWeights;

         double m_sumOfBkgWeights;

         size_t m_scaleToNumEvents;


         double m_cutValue;

         std::vector<Pattern>* m_pResultPatternContainer;

         std::string m_fileNameResult;

         std::string m_fileNameNetConfig;


         /* TH2F* m_histROC; */

         /* TH2F* m_histSignificance; */


         /* TH1F* m_histError; */

         /* TH1F* m_histOutputSignal; */

         /* TH1F* m_histOutputBackground; */

      };


      /// used to distinguish between different function signatures
      enum class ModeOutput
      {
         FETCH ///< the only enumerator (implicit value 0)
      };


      /*! \brief error functions to be chosen from

       *

       *

       */

      enum class ModeErrorFunction
      {
         SUMOFSQUARES                 = 'S', ///< encoded as the character 'S'
         CROSSENTROPY                 = 'C', ///< encoded as the character 'C'
         CROSSENTROPY_MUTUALEXCLUSIVE = 'M'  ///< encoded as the character 'M'
      };


      /*! \brief weight initialization strategies to be chosen from

       *

       *

       */

      enum class WeightInitializationStrategy
      {
         XAVIER,       ///< implicit value 0
         TEST,         ///< implicit value 1
         LAYERSIZE,    ///< implicit value 2
         XAVIERUNIFORM ///< implicit value 3
      };


      /*! \brief neural net

       *

       * holds the structure of all layers and some data for the whole net

       * does not know the layer data though (i.e. values of the nodes and weights)

       */

      class Net

      {

      public:


         typedef std::vector<double> container_type;

         typedef container_type::iterator iterator_type;

         typedef std::pair<iterator_type,iterator_type> begin_end_type;


         /*! \brief c'tor

          *

          *

          */

         Net ()

            : m_eErrorFunction (ModeErrorFunction::SUMOFSQUARES)

            , m_sizeInput (0)

            , m_layers ()

            {

            }


         /*! \brief d'tor

          *

          *

          */

         Net (const Net& other)

            : m_eErrorFunction (other.m_eErrorFunction)

            , m_sizeInput (other.m_sizeInput)

            , m_layers (other.m_layers)

            {

            }


         void setInputSize (size_t sizeInput) { m_sizeInput = sizeInput; } ///< set the input size of the DNN

         void setOutputSize (size_t sizeOutput) { m_sizeOutput = sizeOutput; } ///< set the output size of the DNN

         void addLayer (Layer& layer) { m_layers.push_back (layer); } ///< add a layer (layout)

         void addLayer (Layer&& layer) { m_layers.push_back (layer); }

         void setErrorFunction (ModeErrorFunction eErrorFunction) { m_eErrorFunction = eErrorFunction; } ///< which error function is to be used


         size_t inputSize () const { return m_sizeInput; } ///< input size of the DNN

         size_t outputSize () const { return m_sizeOutput; } ///< output size of the DNN


         /*! \brief set the drop out configuration

          *

          *

          */

         template <typename WeightsType, typename DropProbabilities>

            void dropOutWeightFactor (WeightsType& weights,

                                      const DropProbabilities& drops,

                                      bool inverse = false);


         /*! \brief start the training

          *

          * \param weights weight vector

          * \param trainPattern training pattern

          * \param testPattern test pattern

          * \param minimizer use this minimizer for training (e.g. SGD)

          * \param settings settings used for this training run

          */

         template <typename Minimizer>

            double train (std::vector<double>& weights,

                          std::vector<Pattern>& trainPattern,

                          const std::vector<Pattern>& testPattern,

                  Minimizer& minimizer,

                  Settings& settings);


         /*! \brief pre-training for future use

          *

          *

          */

         template <typename Minimizer>

            void preTrain (std::vector<double>& weights,

                           std::vector<Pattern>& trainPattern,

                           const std::vector<Pattern>& testPattern,

                           Minimizer& minimizer, Settings& settings);


         /*! \brief executes one training cycle

          *

          * \param minimizier the minimizer to be used

          * \param weights the weight vector to be used

          * \param itPatternBegin the pattern to be trained with

          * \param itPatternEnd the pattern to be trainied with

          * \param settings the settings for the training

          * \param dropContainer the configuration for DNN drop-out

          */

         template <typename Iterator, typename Minimizer>

            inline double trainCycle (Minimizer& minimizer, std::vector<double>& weights,

               Iterator itPatternBegin, Iterator itPatternEnd,

                              Settings& settings,

                              DropContainer& dropContainer);


         size_t numWeights (size_t trainingStartLayer = 0) const; ///< returns the number of weights in this net

    size_t numNodes   (size_t trainingStartLayer = 0) const; ///< returns the number of nodes in this net


         template <typename Weights>

            std::vector<double> compute (const std::vector<double>& input, const Weights& weights) const; ///< compute the net with the given input and the given weights


         template <typename Weights, typename PassThrough>

            double operator() (PassThrough& settingsAndBatch, const Weights& weights) const; ///< execute computation of the DNN for one mini-batch (used by the minimizer); no computation of gradients


         template <typename Weights, typename PassThrough, typename OutContainer>

            double operator() (PassThrough& settingsAndBatch, const Weights& weights, ModeOutput eFetch, OutContainer& outputContainer) const; ///< execute computation of the DNN for one mini-batch; helper function


         template <typename Weights, typename Gradients, typename PassThrough>

        double operator() (PassThrough& settingsAndBatch, Weights& weights, Gradients& gradients) const;  ///< execute computation of the DNN for one mini-batch (used by the minimizer); returns gradients as well


         template <typename Weights, typename Gradients, typename PassThrough, typename OutContainer>

        double operator() (PassThrough& settingsAndBatch, Weights& weights, Gradients& gradients, ModeOutput eFetch, OutContainer& outputContainer) const;


    template <typename LayerContainer, typename DropContainer, typename ItWeight, typename ItGradient>

        std::vector<std::vector<LayerData>> prepareLayerData (LayerContainer& layers,

                                                              Batch& batch,

                                                              const DropContainer& dropContainer,

                                                              ItWeight itWeightBegin,

                                                              ItWeight itWeightEnd,

                                                              ItGradient itGradientBegin,

                                                              ItGradient itGradientEnd,

                                                              size_t& totalNumWeights) const;


    template <typename LayerContainer>

        void forwardPattern (const LayerContainer& _layers,

                             std::vector<LayerData>& layerData) const;


    template <typename LayerContainer, typename LayerPatternContainer>

        void forwardBatch (const LayerContainer& _layers,

                           LayerPatternContainer& layerPatternData,

                           std::vector<double>& valuesMean,

                           std::vector<double>& valuesStdDev,

                           size_t trainFromLayer) const;


    template <typename OutputContainer>

        void fetchOutput (const LayerData& lastLayerData, OutputContainer& outputContainer) const;


    template <typename OutputContainer>

        void fetchOutput (const std::vector<LayerData>& layerPatternData, OutputContainer& outputContainer) const;


    template <typename ItWeight>

        std::tuple</*sumError*/double,/*sumWeights*/double> computeError (const Settings& settings,

                                                                          std::vector<LayerData>& lastLayerData,

                                                                          Batch& batch,

                                                                          ItWeight itWeightBegin,

                                                                          ItWeight itWeightEnd) const;


    template <typename Settings>

        void backPropagate (std::vector<std::vector<LayerData>>& layerPatternData,

                            const Settings& settings,

                            size_t trainFromLayer,

                            size_t totalNumWeights) const;


    /*! \brief main NN computation function

          *

          *

          */

         template <typename LayerContainer, typename PassThrough, typename ItWeight, typename ItGradient, typename OutContainer>

            double forward_backward (LayerContainer& layers, PassThrough& settingsAndBatch,

              ItWeight itWeightBegin, ItWeight itWeightEnd,

                                     ItGradient itGradientBegin, ItGradient itGradientEnd,

                                     size_t trainFromLayer,

                                     OutContainer& outputContainer, bool fetchOutput) const;


         double E ();

         void dE ();


         /*! \brief computes the error of the DNN

          *

          *

          */

         template <typename Container, typename ItWeight>

            double errorFunction (LayerData& layerData,

                                  Container truth,

                                  ItWeight itWeight,

                                  ItWeight itWeightEnd,

                                  double patternWeight,

                                  double factorWeightDecay,

                                  EnumRegularization eRegularization) const;


         const std::vector<Layer>& layers () const { return m_layers; } ///< returns the layers (structure)

         std::vector<Layer>& layers ()  { return m_layers; } ///< returns the layers (structure)


         void removeLayer () { m_layers.pop_back (); } ///< remove one layer


         void clear () ///< clear one layer

         {

            m_layers.clear ();

            m_eErrorFunction = ModeErrorFunction::SUMOFSQUARES;

         }


         template <typename OutIterator>

            void initializeWeights (WeightInitializationStrategy eInitStrategy,

                                    OutIterator itWeight); ///< initialize the weights with the given strategy


      protected:


         void fillDropContainer (DropContainer& dropContainer, double dropFraction, size_t numNodes) const; ///< prepare the drop-out-container (select the nodes which are to be dropped out)


      private:


         ModeErrorFunction m_eErrorFunction; ///< denotes the error function

         size_t m_sizeInput; ///< input size of this DNN

         size_t m_sizeOutput; ///< outut size of this DNN

         std::vector<Layer> m_layers; ///< layer-structure-data


      protected:

         // variables for JsMVA (interactive training in jupyter notebook)

         IPythonInteractive *fInteractive = nullptr;

         bool * fExitFromTraining = nullptr;

         UInt_t *fIPyMaxIter = nullptr, *fIPyCurrentIter = nullptr;


      public:


        // setup ipython interactive variables

        void SetIpythonInteractive(IPythonInteractive* fI, bool* fE, UInt_t *M, UInt_t *C){

          fInteractive = fI;

          fExitFromTraining = fE;

          fIPyMaxIter = M;

          fIPyCurrentIter = C;

        }

      };


/// Tuple of references to the settings, the current batch and the drop-out container.
/// NOTE(review): presumably the PassThrough argument handed to Net::operator() -- confirm.
using pass_through_type = std::tuple<Settings&, Batch&, DropContainer&>;


   } // namespace DNN

} // namespace TMVA


// include the implementations (in header file, because they are templated)

#include "TMVA/NeuralNet.icc"


#endif


double
double
Definition: Converters.cxx:921

Monitoring.h

NeuralNet.icc

Pattern.h

R
#define R(a, b, c, d, e, f, g, h, i)
Definition: RSha256.hxx:110

e
#define e(i)
Definition: RSha256.hxx:103

NONE
#define NONE
Definition: Rotated.cxx:52

Int_t
int Int_t
Definition: RtypesCore.h:43

EColor
EColor
Definition: Rtypes.h:63

TApplication.h

name
char name[80]
Definition: TGX11.cxx:109

type
int type
Definition: TGX11.cxx:120

TH1F.h

TH2F.h

sqrt
double sqrt(double)

Timer.h

Function
Double_t(* Function)(Double_t)
Definition: Functor.C:4

R

TMVA::DNN::Batch
The Batch class encapsulates one mini-batch.
Definition: NeuralNet.h:234

TMVA::DNN::Batch::m_itEnd
const_iterator m_itEnd
iterator denoting the end of the batch
Definition: NeuralNet.h:250

TMVA::DNN::Batch::begin
const_iterator begin() const
Definition: NeuralNet.h:243

TMVA::DNN::Batch::end
const_iterator end() const
Definition: NeuralNet.h:244

TMVA::DNN::Batch::Batch
Batch(typename std::vector< Pattern >::const_iterator itBegin, typename std::vector< Pattern >::const_iterator itEnd)
Definition: NeuralNet.h:238

TMVA::DNN::Batch::size
size_t size() const
Definition: NeuralNet.h:246

TMVA::DNN::Batch::const_iterator
std::vector< Pattern >::const_iterator const_iterator
Definition: NeuralNet.h:236

TMVA::DNN::Batch::m_itBegin
const_iterator m_itBegin
iterator denoting the beginning of the batch
Definition: NeuralNet.h:249

TMVA::DNN::ClassificationSettings
Settings for classification; contains additional settings if the DNN problem is classification.
Definition: NeuralNet.h:900

TMVA::DNN::ClassificationSettings::startTrainCycle
void startTrainCycle()
action to be done when the training cycle is started
Definition: NeuralNet.cxx:281

TMVA::DNN::ClassificationSettings::testIteration
void testIteration()
callback for monitoring and logging
Definition: NeuralNet.h:935

TMVA::DNN::ClassificationSettings::endTrainCycle
void endTrainCycle(double)
action to be done when the training cycle is ended
Definition: NeuralNet.cxx:296

TMVA::DNN::ClassificationSettings::endTestCycle
virtual void endTestCycle()
action to be done when the test cycle is ended
Definition: NeuralNet.cxx:326

TMVA::DNN::ClassificationSettings::m_pResultPatternContainer
std::vector< Pattern > * m_pResultPatternContainer
Definition: NeuralNet.h:1014

TMVA::DNN::ClassificationSettings::setResultComputation
void setResultComputation(std::string _fileNameNetConfig, std::string _fileNameResult, std::vector< Pattern > *_resultPatternContainer)
preparation for monitoring output
Definition: NeuralNet.cxx:523

TMVA::DNN::ClassificationSettings::m_fileNameResult
std::string m_fileNameResult
Definition: NeuralNet.h:1015

TMVA::DNN::ClassificationSettings::ClassificationSettings
ClassificationSettings(TString name, size_t _convergenceSteps=15, size_t _batchSize=10, size_t _testRepetitions=7, double _factorWeightDecay=1e-5, EnumRegularization _regularization=EnumRegularization::NONE, size_t _scaleToNumEvents=0, MinimizerType _eMinimizerType=MinimizerType::fSteepest, double _learningRate=1e-5, double _momentum=0.3, int _repetitions=3, bool _useMultithreading=true)
c'tor
Definition: NeuralNet.h:906

TMVA::DNN::ClassificationSettings::m_input
std::vector< double > m_input
Definition: NeuralNet.h:1000

TMVA::DNN::ClassificationSettings::m_significances
std::vector< double > m_significances
Definition: NeuralNet.h:1006

TMVA::DNN::ClassificationSettings::m_sumOfSigWeights
double m_sumOfSigWeights
Definition: NeuralNet.h:1009

TMVA::DNN::ClassificationSettings::m_weights
std::vector< double > m_weights
Definition: NeuralNet.h:1003

TMVA::DNN::ClassificationSettings::m_fileNameNetConfig
std::string m_fileNameNetConfig
Definition: NeuralNet.h:1016

TMVA::DNN::ClassificationSettings::~ClassificationSettings
virtual ~ClassificationSettings()
d'tor
Definition: NeuralNet.h:929

TMVA::DNN::ClassificationSettings::m_targets
std::vector< double > m_targets
Definition: NeuralNet.h:1002

TMVA::DNN::ClassificationSettings::testSample
void testSample(double error, double output, double target, double weight)
action to be done after the computation of a test sample
Definition: NeuralNet.cxx:304

TMVA::DNN::ClassificationSettings::m_scaleToNumEvents
size_t m_scaleToNumEvents
Definition: NeuralNet.h:1011

TMVA::DNN::ClassificationSettings::startTestCycle
virtual void startTestCycle()
action to be done when the test cycle is started
Definition: NeuralNet.cxx:316

TMVA::DNN::ClassificationSettings::m_sumOfBkgWeights
double m_sumOfBkgWeights
Definition: NeuralNet.h:1010

TMVA::DNN::ClassificationSettings::setWeightSums
void setWeightSums(double sumOfSigWeights, double sumOfBkgWeights)
set the weight sums to be scaled to (preparations for monitoring output)
Definition: NeuralNet.cxx:515

TMVA::DNN::ClassificationSettings::m_ams
std::vector< double > m_ams
Definition: NeuralNet.h:1005

TMVA::DNN::ClassificationSettings::m_cutValue
double m_cutValue
Definition: NeuralNet.h:1013

TMVA::DNN::ClassificationSettings::m_output
std::vector< double > m_output
Definition: NeuralNet.h:1001

TMVA::DNN::LayerData
LayerData holds the data of one layer.
Definition: NeuralNet.h:436

TMVA::DNN::LayerData::m_itInputBegin
const_iterator_type m_itInputBegin
iterator to the first of the nodes in the input node vector
Definition: NeuralNet.h:641

TMVA::DNN::LayerData::deltasBegin
const_iterator_type deltasBegin() const
returns const iterator to the begin of the deltas (back-propagation)
Definition: NeuralNet.h:596

TMVA::DNN::LayerData::valuesBegin
iterator_type valuesBegin()
returns iterator to the begin of the (node) values
Definition: NeuralNet.h:587

TMVA::DNN::LayerData::valuesEnd
const_iterator_type valuesEnd() const
returns iterator to the end of the (node) values
Definition: NeuralNet.h:585

TMVA::DNN::LayerData::m_hasGradients
bool m_hasGradients
does this layer have gradients (only if in training mode)
Definition: NeuralNet.h:658

TMVA::DNN::LayerData::m_deltas
std::vector< double > m_deltas
stores the deltas for the DNN training
Definition: NeuralNet.h:644

TMVA::DNN::LayerData::iterator_type
container_type::iterator iterator_type
Definition: NeuralNet.h:440

TMVA::DNN::LayerData::LayerData
LayerData(const_iterator_type itInputBegin, const_iterator_type itInputEnd, ModeOutputValues eModeOutput=ModeOutputValues::DIRECT)
c'tor of LayerData
Definition: NeuralNet.cxx:81

TMVA::DNN::LayerData::setDropOut
void setDropOut(Iterator itDrop)
set the drop-out info for this layer
Definition: NeuralNet.h:616

TMVA::DNN::LayerData::setInput
void setInput(const_iterator_type itInputBegin, const_iterator_type itInputEnd)
change the input iterators
Definition: NeuralNet.h:567

TMVA::DNN::LayerData::function_container_type
std::vector< std::function< double(double)> > function_container_type
Definition: NeuralNet.h:443

TMVA::DNN::LayerData::valuesEnd
iterator_type valuesEnd()
returns iterator to the end of the (node) values
Definition: NeuralNet.h:588

TMVA::DNN::LayerData::m_itDropOut
const_dropout_iterator m_itDropOut
iterator to a container indicating if the corresponding node is to be dropped
Definition: NeuralNet.h:647

TMVA::DNN::LayerData::valueGradientsBegin
iterator_type valueGradientsBegin()
returns iterator to the begin of the gradients of the node values
Definition: NeuralNet.h:599

TMVA::DNN::LayerData::gradientsBegin
iterator_type gradientsBegin()
returns iterator to the begin of the gradients
Definition: NeuralNet.h:605

TMVA::DNN::LayerData::deltasBegin
iterator_type deltasBegin()
returns iterator to the begin of the deltas (back-propagation)
Definition: NeuralNet.h:593

TMVA::DNN::LayerData::m_hasWeights
bool m_hasWeights
does this layer have weights (it does not if it is the input layer)
Definition: NeuralNet.h:657

TMVA::DNN::LayerData::dropOut
const_dropout_iterator dropOut() const
return the begin of the drop-out information
Definition: NeuralNet.h:625

TMVA::DNN::LayerData::~LayerData
~LayerData()
Definition: NeuralNet.h:470

TMVA::DNN::LayerData::LayerData
LayerData(LayerData &&other)
move c'tor of LayerData
Definition: NeuralNet.h:540

TMVA::DNN::LayerData::container_type
std::vector< double > container_type
Definition: NeuralNet.h:438

TMVA::DNN::LayerData::size
size_t size() const
return the size of the layer
Definition: NeuralNet.h:627

TMVA::DNN::LayerData::weightsBegin
const_iterator_type weightsBegin() const
returns const iterator to the begin of the weights for this layer
Definition: NeuralNet.h:607

TMVA::DNN::LayerData::const_function_iterator_type
function_container_type::const_iterator const_function_iterator_type
Definition: NeuralNet.h:445

TMVA::DNN::LayerData::LayerData
LayerData(const LayerData &other)
copy c'tor of LayerData
Definition: NeuralNet.h:517

TMVA::DNN::LayerData::function_iterator_type
function_container_type::iterator function_iterator_type
Definition: NeuralNet.h:444

TMVA::DNN::LayerData::m_values
std::vector< double > m_values
stores the values of the nodes in this layer
Definition: NeuralNet.h:646

TMVA::DNN::LayerData::m_itInputEnd
const_iterator_type m_itInputEnd
iterator to the end of the nodes in the input node vector
Definition: NeuralNet.h:642

TMVA::DNN::LayerData::const_iterator_type
container_type::const_iterator const_iterator_type
Definition: NeuralNet.h:441

TMVA::DNN::LayerData::outputMode
ModeOutputValues outputMode() const
returns the output mode
Definition: NeuralNet.h:590

TMVA::DNN::LayerData::m_itGradientBegin
iterator_type m_itGradientBegin
iterator to the first gradient of this layer in the gradient vector
Definition: NeuralNet.h:651

TMVA::DNN::LayerData::gradientsBegin
const_iterator_type gradientsBegin() const
returns const iterator to the begin of the gradients
Definition: NeuralNet.h:606

TMVA::DNN::LayerData::inverseActivationFunction
std::shared_ptr< std::function< double(double)> > inverseActivationFunction() const
Definition: NeuralNet.h:610

TMVA::DNN::LayerData::deltasEnd
iterator_type deltasEnd()
returns iterator to the end of the deltas (back-propagation)
Definition: NeuralNet.h:594

TMVA::DNN::LayerData::m_valueGradients
std::vector< double > m_valueGradients
stores the gradients of the values (nodes)
Definition: NeuralNet.h:645

TMVA::DNN::LayerData::m_itConstWeightBegin
const_iterator_type m_itConstWeightBegin
const iterator to the first weight of this layer in the weight vector
Definition: NeuralNet.h:650

TMVA::DNN::LayerData::valueGradientsEnd
iterator_type valueGradientsEnd()
returns iterator to the end of the gradients of the node values
Definition: NeuralNet.h:600

TMVA::DNN::LayerData::clear
void clear()
clear the values and the deltas
Definition: NeuralNet.h:578

TMVA::DNN::LayerData::activationFunction
std::shared_ptr< std::function< double(double)> > activationFunction() const
Definition: NeuralNet.h:609

TMVA::DNN::LayerData::computeProbabilities
container_type computeProbabilities() const
compute the probabilities from the node values
Definition: NeuralNet.cxx:140

TMVA::DNN::LayerData::deltasEnd
const_iterator_type deltasEnd() const
returns const iterator to the end of the deltas (back-propagation)
Definition: NeuralNet.h:597

TMVA::DNN::LayerData::m_hasDropOut
bool m_hasDropOut
dropOut is turned on?
Definition: NeuralNet.h:648

TMVA::DNN::LayerData::m_isInputLayer
bool m_isInputLayer
is this layer an input layer
Definition: NeuralNet.h:656

TMVA::DNN::LayerData::m_size
size_t m_size
Definition: NeuralNet.h:639

TMVA::DNN::LayerData::hasDropOut
bool hasDropOut() const
has this layer drop-out turned on?
Definition: NeuralNet.h:624

TMVA::DNN::LayerData::valueGradientsBegin
const_iterator_type valueGradientsBegin() const
returns const iterator to the begin of the gradients
Definition: NeuralNet.h:602

TMVA::DNN::LayerData::valueGradientsEnd
const_iterator_type valueGradientsEnd() const
returns const iterator to the end of the gradients
Definition: NeuralNet.h:603

TMVA::DNN::LayerData::probabilities
container_type probabilities() const
computes the probabilities from the current node values and returns them
Definition: NeuralNet.h:591

TMVA::DNN::LayerData::clearDropOut
void clearDropOut()
clear the drop-out-data for this layer
Definition: NeuralNet.h:622

TMVA::DNN::LayerData::m_eModeOutput
ModeOutputValues m_eModeOutput
stores the output mode (DIRECT, SIGMOID, SOFTMAX)
Definition: NeuralNet.h:660

TMVA::DNN::LayerData::m_inverseActivationFunction
std::shared_ptr< std::function< double(double)> > m_inverseActivationFunction
inverse activation function for this layer
Definition: NeuralNet.h:654

TMVA::DNN::LayerData::const_dropout_iterator
DropContainer::const_iterator const_dropout_iterator
Definition: NeuralNet.h:447

TMVA::DNN::LayerData::valuesBegin
const_iterator_type valuesBegin() const
returns const iterator to the begin of the (node) values
Definition: NeuralNet.h:584

TMVA::DNN::LayerData::m_activationFunction
std::shared_ptr< std::function< double(double)> > m_activationFunction
activation function for this layer
Definition: NeuralNet.h:653

TMVA::DNN::Layer
Layer defines the layout of a layer.
Definition: NeuralNet.h:675

TMVA::DNN::Layer::modeOutputValues
void modeOutputValues(ModeOutputValues eModeOutputValues)
set the mode-output-value
Definition: NeuralNet.h:688

TMVA::DNN::Layer::m_activationFunction
std::shared_ptr< std::function< double(double)> > m_activationFunction
stores the activation function
Definition: NeuralNet.h:701

TMVA::DNN::Layer::activationFunction
std::shared_ptr< std::function< double(double)> > activationFunction() const
fetch the activation function for this layer
Definition: NeuralNet.h:693

TMVA::DNN::Layer::m_numNodes
size_t m_numNodes
Definition: NeuralNet.h:705

TMVA::DNN::Layer::m_inverseActivationFunction
std::shared_ptr< std::function< double(double)> > m_inverseActivationFunction
stores the inverse activation function
Definition: NeuralNet.h:702

TMVA::DNN::Layer::numNodes
size_t numNodes() const
return the number of nodes of this layer
Definition: NeuralNet.h:690

TMVA::DNN::Layer::m_eModeOutputValues
ModeOutputValues m_eModeOutputValues
do the output values of this layer have to be transformed somehow (e.g. to probabilities) or returned...
Definition: NeuralNet.h:707

TMVA::DNN::Layer::numWeights
size_t numWeights(size_t numInputNodes) const
return the number of weights for this layer (fully connected)
Definition: NeuralNet.h:691

TMVA::DNN::Layer::inverseActivationFunction
std::shared_ptr< std::function< double(double)> > inverseActivationFunction() const
fetch the inverse activation function for this layer
Definition: NeuralNet.h:694

TMVA::DNN::Layer::m_activationFunctionType
EnumFunction m_activationFunctionType
Definition: NeuralNet.h:708

TMVA::DNN::Layer::Layer
Layer(size_t numNodes, EnumFunction activationFunction, ModeOutputValues eModeOutputValues=ModeOutputValues::DIRECT)
c'tor for defining a Layer
Definition: NeuralNet.cxx:166

TMVA::DNN::Layer::activationFunctionType
EnumFunction activationFunctionType() const
get the activation function type for this layer
Definition: NeuralNet.h:696

TMVA::DNN::Layer::modeOutputValues
ModeOutputValues modeOutputValues() const
get the mode-output-value (direct, probabilities)
Definition: NeuralNet.h:687

TMVA::DNN::MeanVariance
Definition: NeuralNet.h:74

TMVA::DNN::MeanVariance::mean
double mean() const
Definition: NeuralNet.h:125

TMVA::DNN::MeanVariance::MeanVariance
MeanVariance()
Definition: NeuralNet.h:76

TMVA::DNN::MeanVariance::clear
void clear()
Definition: NeuralNet.h:83

TMVA::DNN::MeanVariance::var_corr
double var_corr() const
Definition: NeuralNet.h:135

TMVA::DNN::MeanVariance::count
int count() const
Definition: NeuralNet.h:123

TMVA::DNN::MeanVariance::add
void add(T value, double weight=1.0)
Definition: NeuralNet.h:92

TMVA::DNN::MeanVariance::stdDev_corr
double stdDev_corr() const
Definition: NeuralNet.h:143

TMVA::DNN::MeanVariance::weights
double weights() const
Definition: NeuralNet.h:124

TMVA::DNN::MeanVariance::m_mean
double m_mean
Definition: NeuralNet.h:149

TMVA::DNN::MeanVariance::m_n
size_t m_n
Definition: NeuralNet.h:147

TMVA::DNN::MeanVariance::m_squared
double m_squared
Definition: NeuralNet.h:150

TMVA::DNN::MeanVariance::m_sumWeights
double m_sumWeights
Definition: NeuralNet.h:148

TMVA::DNN::MeanVariance::add
void add(ITERATOR itBegin, ITERATOR itEnd)
Definition: NeuralNet.h:115

TMVA::DNN::MeanVariance::var
double var() const
Definition: NeuralNet.h:126

TMVA::DNN::MeanVariance::stdDev
double stdDev() const
Definition: NeuralNet.h:144

TMVA::DNN::Net
neural net
Definition: NeuralNet.h:1067

TMVA::DNN::Net::setInputSize
void setInputSize(size_t sizeInput)
set the input size of the DNN
Definition: NeuralNet.h:1097

TMVA::DNN::Net::layers
std::vector< Layer > & layers()
returns the layers (structure)
Definition: NeuralNet.h:1251

TMVA::DNN::Net::forwardBatch
void forwardBatch(const LayerContainer &_layers, LayerPatternContainer &layerPatternData, std::vector< double > &valuesMean, std::vector< double > &valuesStdDev, size_t trainFromLayer) const
Definition: NeuralNet.icc:1245

TMVA::DNN::Net::Net
Net(const Net &other)
copy c'tor
Definition: NeuralNet.h:1090

TMVA::DNN::Net::fExitFromTraining
bool * fExitFromTraining
Definition: NeuralNet.h:1282

TMVA::DNN::Net::Net
Net()
c'tor
Definition: NeuralNet.h:1079

TMVA::DNN::Net::m_layers
std::vector< Layer > m_layers
layer-structure-data
Definition: NeuralNet.h:1277

TMVA::DNN::Net::fIPyMaxIter
UInt_t * fIPyMaxIter
Definition: NeuralNet.h:1283

TMVA::DNN::Net::SetIpythonInteractive
void SetIpythonInteractive(IPythonInteractive *fI, bool *fE, UInt_t *M, UInt_t *C)
Definition: NeuralNet.h:1288

TMVA::DNN::Net::compute
std::vector< double > compute(const std::vector< double > &input, const Weights &weights) const
compute the net with the given input and the given weights
Definition: NeuralNet.icc:1039

TMVA::DNN::Net::container_type
std::vector< double > container_type
Definition: NeuralNet.h:1070

TMVA::DNN::Net::iterator_type
container_type::iterator iterator_type
Definition: NeuralNet.h:1071

TMVA::DNN::Net::preTrain
void preTrain(std::vector< double > &weights, std::vector< Pattern > &trainPattern, const std::vector< Pattern > &testPattern, Minimizer &minimizer, Settings &settings)
pre-training for future use

TMVA::DNN::Net::fetchOutput
void fetchOutput(const LayerData &lastLayerData, OutputContainer &outputContainer) const
Definition: NeuralNet.icc:1300

TMVA::DNN::Net::inputSize
size_t inputSize() const
input size of the DNN
Definition: NeuralNet.h:1103

TMVA::DNN::Net::clear
void clear()
Definition: NeuralNet.h:1256

TMVA::DNN::Net::begin_end_type
std::pair< iterator_type, iterator_type > begin_end_type
Definition: NeuralNet.h:1072

TMVA::DNN::Net::m_eErrorFunction
ModeErrorFunction m_eErrorFunction
denotes the error function
Definition: NeuralNet.h:1274

TMVA::DNN::Net::dE
void dE()

TMVA::DNN::Net::addLayer
void addLayer(Layer &&layer)
Definition: NeuralNet.h:1100

TMVA::DNN::Net::numNodes
size_t numNodes(size_t trainingStartLayer=0) const
returns the number of nodes in this net
Definition: NeuralNet.cxx:559

TMVA::DNN::Net::train
double train(std::vector< double > &weights, std::vector< Pattern > &trainPattern, const std::vector< Pattern > &testPattern, Minimizer &minimizer, Settings &settings)
start the training
Definition: NeuralNet.icc:712

TMVA::DNN::Net::layers
const std::vector< Layer > & layers() const
returns the layers (structure)
Definition: NeuralNet.h:1250

TMVA::DNN::Net::prepareLayerData
std::vector< std::vector< LayerData > > prepareLayerData(LayerContainer &layers, Batch &batch, const DropContainer &dropContainer, ItWeight itWeightBegin, ItWeight itWeightEnd, ItGradient itGradientBegin, ItGradient itGradientEnd, size_t &totalNumWeights) const
Definition: NeuralNet.icc:1113

TMVA::DNN::Net::setErrorFunction
void setErrorFunction(ModeErrorFunction eErrorFunction)
which error function is to be used
Definition: NeuralNet.h:1101

TMVA::DNN::Net::initializeWeights
void initializeWeights(WeightInitializationStrategy eInitStrategy, OutIterator itWeight)
initialize the weights with the given strategy
Definition: NeuralNet.icc:1483

TMVA::DNN::Net::outputSize
size_t outputSize() const
output size of the DNN
Definition: NeuralNet.h:1104

TMVA::DNN::Net::errorFunction
double errorFunction(LayerData &layerData, Container truth, ItWeight itWeight, ItWeight itWeightEnd, double patternWeight, double factorWeightDecay, EnumRegularization eRegularization) const
computes the error of the DNN
Definition: NeuralNet.icc:1592

TMVA::DNN::Net::forward_backward
double forward_backward(LayerContainer &layers, PassThrough &settingsAndBatch, ItWeight itWeightBegin, ItWeight itWeightEnd, ItGradient itGradientBegin, ItGradient itGradientEnd, size_t trainFromLayer, OutContainer &outputContainer, bool fetchOutput) const
main NN computation function
Definition: NeuralNet.icc:1418

TMVA::DNN::Net::removeLayer
void removeLayer()
remove one layer
Definition: NeuralNet.h:1253

TMVA::DNN::Net::m_sizeOutput
size_t m_sizeOutput
output size of this DNN
Definition: NeuralNet.h:1276

TMVA::DNN::Net::m_sizeInput
size_t m_sizeInput
input size of this DNN
Definition: NeuralNet.h:1275

TMVA::DNN::Net::trainCycle
double trainCycle(Minimizer &minimizer, std::vector< double > &weights, Iterator itPatternBegin, Iterator itPatternEnd, Settings &settings, DropContainer &dropContainer)
executes one training cycle
Definition: NeuralNet.icc:941

TMVA::DNN::Net::fIPyCurrentIter
UInt_t * fIPyCurrentIter
Definition: NeuralNet.h:1283

TMVA::DNN::Net::operator()
double operator()(PassThrough &settingsAndBatch, const Weights &weights) const
execute computation of the DNN for one mini-batch (used by the minimizer); no computation of gradient...
Definition: NeuralNet.icc:1072

TMVA::DNN::Net::dropOutWeightFactor
void dropOutWeightFactor(WeightsType &weights, const DropProbabilities &drops, bool inverse=false)
set the drop out configuration
Definition: NeuralNet.icc:652

TMVA::DNN::Net::fillDropContainer
void fillDropContainer(DropContainer &dropContainer, double dropFraction, size_t numNodes) const
prepare the drop-out-container (select the nodes which are to be dropped out)
Definition: NeuralNet.cxx:575

TMVA::DNN::Net::addLayer
void addLayer(Layer &layer)
add a layer (layout)
Definition: NeuralNet.h:1099

TMVA::DNN::Net::numWeights
size_t numWeights(size_t trainingStartLayer=0) const
returns the number of weights in this net
Definition: NeuralNet.cxx:543

TMVA::DNN::Net::fInteractive
IPythonInteractive * fInteractive
Definition: NeuralNet.h:1281

TMVA::DNN::Net::E
double E()

TMVA::DNN::Net::computeError
std::tuple< double, double > computeError(const Settings &settings, std::vector< LayerData > &lastLayerData, Batch &batch, ItWeight itWeightBegin, ItWeight itWeightEnd) const
Definition: NeuralNet.icc:1330

TMVA::DNN::Net::setOutputSize
void setOutputSize(size_t sizeOutput)
set the output size of the DNN
Definition: NeuralNet.h:1098

TMVA::DNN::Net::forwardPattern
void forwardPattern(const LayerContainer &_layers, std::vector< LayerData > &layerData) const
Definition: NeuralNet.icc:1225

TMVA::DNN::Net::backPropagate
void backPropagate(std::vector< std::vector< LayerData > > &layerPatternData, const Settings &settings, size_t trainFromLayer, size_t totalNumWeights) const
Definition: NeuralNet.icc:1367

TMVA::DNN::Settings
Settings for the training of the neural net.
Definition: NeuralNet.h:735

TMVA::DNN::Settings::m_batchSize
size_t m_batchSize
mini-batch size
Definition: NeuralNet.h:843

TMVA::DNN::Settings::setDropOut
void setDropOut(Iterator begin, Iterator end, size_t _dropRepetitions)
set the drop-out configuration (layer-wise)
Definition: NeuralNet.h:764

TMVA::DNN::Settings::create
void create(std::string histoName, int bins, double min, double max, int bins2, double min2, double max2)
for monitoring
Definition: NeuralNet.h:825

TMVA::DNN::Settings::useMultithreading
bool useMultithreading() const
is multithreading turned on?
Definition: NeuralNet.h:820

TMVA::DNN::Settings::regularization
EnumRegularization regularization() const
some regularization of the DNN is turned on?
Definition: NeuralNet.h:818

TMVA::DNN::Settings::convergenceCount
size_t convergenceCount() const
returns the current convergence count
Definition: NeuralNet.h:832

TMVA::DNN::Settings::momentum
double momentum() const
get the momentum (e.g. for SGD)
Definition: NeuralNet.h:777

TMVA::DNN::Settings::count_E
size_t count_E
Definition: NeuralNet.h:847

TMVA::DNN::Settings::m_timer
Timer m_timer
timer for monitoring
Definition: NeuralNet.h:837

TMVA::DNN::Settings::testRepetitions
size_t testRepetitions() const
how often is the test data tested
Definition: NeuralNet.h:773

TMVA::DNN::Settings::clear
void clear(std::string histoName)
for monitoring
Definition: NeuralNet.h:829

TMVA::DNN::Settings::endTestCycle
virtual void endTestCycle()
callback for monitoring and logging
Definition: NeuralNet.h:810

TMVA::DNN::Settings::fMinimizerType
MinimizerType fMinimizerType
Definition: NeuralNet.h:860

TMVA::DNN::Settings::addPoint
void addPoint(std::string histoName, double x, double y)
for monitoring
Definition: NeuralNet.h:827

TMVA::DNN::Settings::setMonitoring
void setMonitoring(std::shared_ptr< Monitoring > ptrMonitoring)
prepared for monitoring
Definition: NeuralNet.h:769

TMVA::DNN::Settings::testIteration
virtual void testIteration()
callback for monitoring and logging
Definition: NeuralNet.h:811

TMVA::DNN::Settings::m_convergenceSteps
size_t m_convergenceSteps
number of steps without improvement to consider the DNN to have converged
Definition: NeuralNet.h:842

TMVA::DNN::Settings::hasConverged
virtual bool hasConverged(double testError)
has this training converged already?
Definition: NeuralNet.cxx:488

TMVA::DNN::Settings::minimizerType
MinimizerType minimizerType() const
which minimizer shall be used (e.g. SGD)
Definition: NeuralNet.h:779

TMVA::DNN::Settings::m_dropOut
std::vector< double > m_dropOut
Definition: NeuralNet.h:855

TMVA::DNN::Settings::m_minProgress
double m_minProgress
current limits for the progress bar
Definition: NeuralNet.h:838

TMVA::DNN::Settings::cycle
virtual void cycle(double progress, TString text)
Definition: NeuralNet.h:804

TMVA::DNN::Settings::Settings
Settings(TString name, size_t _convergenceSteps=15, size_t _batchSize=10, size_t _testRepetitions=7, double _factorWeightDecay=1e-5, TMVA::DNN::EnumRegularization _regularization=TMVA::DNN::EnumRegularization::NONE, MinimizerType _eMinimizerType=MinimizerType::fSteepest, double _learningRate=1e-5, double _momentum=0.3, int _repetitions=3, bool _multithreading=true)
c'tor
Definition: NeuralNet.cxx:232

TMVA::DNN::Settings::setProgressLimits
virtual void setProgressLimits(double minProgress=0, double maxProgress=100)
Definition: NeuralNet.h:795

TMVA::DNN::Settings::m_maxProgress
double m_maxProgress
current limits for the progress bar
Definition: NeuralNet.h:839

TMVA::DNN::Settings::endTrainCycle
virtual void endTrainCycle(double)
callback for monitoring and logging
Definition: NeuralNet.h:793

TMVA::DNN::Settings::count_dE
size_t count_dE
Definition: NeuralNet.h:848

TMVA::DNN::Settings::drawSample
virtual void drawSample(const std::vector< double > &, const std::vector< double > &, const std::vector< double > &, double)
callback for monitoring and logging
Definition: NeuralNet.h:812

TMVA::DNN::Settings::learningRate
double learningRate() const
get the learning rate
Definition: NeuralNet.h:776

TMVA::DNN::Settings::m_dropRepetitions
double m_dropRepetitions
Definition: NeuralNet.h:854

TMVA::DNN::Settings::dropFractions
const std::vector< double > & dropFractions() const
Definition: NeuralNet.h:767

TMVA::DNN::Settings::addPoint
void addPoint(std::string histoName, double x)
for monitoring
Definition: NeuralNet.h:826

TMVA::DNN::Settings::~Settings
virtual ~Settings()
d'tor
Definition: NeuralNet.cxx:261

TMVA::DNN::Settings::m_convergenceCount
size_t m_convergenceCount
Definition: NeuralNet.h:862

TMVA::DNN::Settings::m_regularization
EnumRegularization m_regularization
Definition: NeuralNet.h:852

TMVA::DNN::Settings::repetitions
int repetitions() const
how many steps are taken before the batch is changed
Definition: NeuralNet.h:778

TMVA::DNN::Settings::m_minError
double m_minError
Definition: NeuralNet.h:864

TMVA::DNN::Settings::testSample
virtual void testSample(double, double, double, double)
virtual function to be used for monitoring (callback)
Definition: NeuralNet.h:786

TMVA::DNN::Settings::plot
void plot(std::string histoName, std::string options, int pad, EColor color)
for monitoring
Definition: NeuralNet.h:828

TMVA::DNN::Settings::startTrainCycle
virtual void startTrainCycle()
Definition: NeuralNet.h:787

TMVA::DNN::Settings::convergenceSteps
size_t convergenceSteps() const
how many steps until training is deemed to have converged
Definition: NeuralNet.h:771

TMVA::DNN::Settings::m_factorWeightDecay
double m_factorWeightDecay
Definition: NeuralNet.h:845

TMVA::DNN::Settings::factorWeightDecay
double factorWeightDecay() const
get the weight-decay factor
Definition: NeuralNet.h:774

TMVA::DNN::Settings::count_mb_dE
size_t count_mb_dE
Definition: NeuralNet.h:850

TMVA::DNN::Settings::m_useMultithreading
bool m_useMultithreading
Definition: NeuralNet.h:868

TMVA::DNN::Settings::count_mb_E
size_t count_mb_E
Definition: NeuralNet.h:849

TMVA::DNN::Settings::exists
bool exists(std::string histoName)
for monitoring
Definition: NeuralNet.h:830

TMVA::DNN::Settings::maxConvergenceCount
size_t maxConvergenceCount() const
returns the max convergence count so far
Definition: NeuralNet.h:833

TMVA::DNN::Settings::pads
void pads(int numPads)
preparation for monitoring
Definition: NeuralNet.h:823

TMVA::DNN::Settings::m_testRepetitions
size_t m_testRepetitions
Definition: NeuralNet.h:844

TMVA::DNN::Settings::fLearningRate
double fLearningRate
Definition: NeuralNet.h:857

TMVA::DNN::Settings::fMomentum
double fMomentum
Definition: NeuralNet.h:858

TMVA::DNN::Settings::batchSize
size_t batchSize() const
mini-batch size
Definition: NeuralNet.h:772

TMVA::DNN::Settings::computeResult
virtual void computeResult(const Net &, std::vector< double > &)
callback for monitoring and logging
Definition: NeuralNet.h:814

TMVA::DNN::Settings::fMonitoring
std::shared_ptr< Monitoring > fMonitoring
Definition: NeuralNet.h:870

TMVA::DNN::Settings::dropRepetitions
size_t dropRepetitions() const
Definition: NeuralNet.h:766

TMVA::DNN::Settings::create
void create(std::string histoName, int bins, double min, double max)
for monitoring
Definition: NeuralNet.h:824

TMVA::DNN::Settings::fRepetitions
int fRepetitions
Definition: NeuralNet.h:859

TMVA::DNN::Settings::minError
size_t minError() const
returns the smallest error so far
Definition: NeuralNet.h:834

TMVA::DNN::Settings::startTraining
virtual void startTraining()
Definition: NeuralNet.h:800

TMVA::DNN::Settings::m_maxConvergenceCount
size_t m_maxConvergenceCount
Definition: NeuralNet.h:863

TMVA::DNN::Settings::startTestCycle
virtual void startTestCycle()
callback for monitoring and logging
Definition: NeuralNet.h:809

TMVA::DNN::Steepest
Steepest Gradient Descent algorithm (SGD)
Definition: NeuralNet.h:333

TMVA::DNN::Steepest::m_repetitions
size_t m_repetitions
Definition: NeuralNet.h:336

TMVA::DNN::Steepest::m_beta
double m_beta
internal parameter (momentum)
Definition: NeuralNet.h:371

TMVA::DNN::Steepest::m_localGradients
std::vector< double > m_localGradients
local gradients for reuse in thread.
Definition: NeuralNet.h:375

TMVA::DNN::Steepest::m_prevGradients
std::vector< double > m_prevGradients
vector remembers the gradients of the previous step
Definition: NeuralNet.h:372

TMVA::DNN::Steepest::m_alpha
double m_alpha
internal parameter (learningRate)
Definition: NeuralNet.h:370

TMVA::DNN::Steepest::m_localWeights
std::vector< double > m_localWeights
local weights for reuse in thread.
Definition: NeuralNet.h:374

TMVA::DNN::Steepest::operator()
double operator()(Function &fitnessFunction, Weights &weights, PassThrough &passThrough)
operator to call the steepest gradient descent algorithm
Definition: NeuralNet.icc:271

TMVA::DNN::Steepest::Steepest
Steepest(double learningRate=1e-4, double momentum=0.5, size_t repetitions=10)
c'tor
Definition: NeuralNet.h:347

TMVA::IPythonInteractive
This class is needed by JsMVA, and it's a helper class for tracking errors during the training in Jup...
Definition: MethodBase.h:94

TMVA::Timer
Timing information for training and evaluation of MVA methods.
Definition: Timer.h:58

TMVA::Timer::DrawProgressBar
void DrawProgressBar(Int_t, const TString &comment="")
draws progress bar in color or B&W caution:
Definition: Timer.cxx:203

TString
Basic string class.
Definition: TString.h:131

unsigned int

text
TText * text
Definition: entrylist_figure1.C:10

RooFit::Minimizer
RooCmdArg Minimizer(const char *type, const char *alg=0)
Definition: RooGlobalFunc.cxx:211

sigma
const Double_t sigma
Definition: h1analysisProxy.h:11

y
Double_t y[n]
Definition: legend1.C:17

x
Double_t x[n]
Definition: legend1.C:17

ROOT::Math::Cephes::Q
static double Q[]
Definition: SpecFuncCephes.cxx:294

ROOT::Math::Cephes::C
static double C[]
Definition: SpecFuncCephes.cxx:187

ROOT::Math::Chebyshev::T
double T(double x)
Definition: ChebyshevPol.h:34

ROOT::R::function
void function(const Char_t *name_, T fun, const Char_t *docstring=0)
Definition: RExports.h:151

TMVA::DNN::sumOfSquares
double sumOfSquares(ItOutput itOutputBegin, ItOutput itOutputEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight)

TMVA::DNN::uniformDouble
double uniformDouble(double minValue, double maxValue)
Definition: NeuralNet.cxx:43

TMVA::DNN::forward
void forward(const LAYERDATA &prevLayerData, LAYERDATA &currLayerData)
apply the weights (and functions) in forward direction of the DNN
Definition: NeuralNet.icc:546

TMVA::DNN::applyFunctions
void applyFunctions(ItValue itValue, ItValue itValueEnd, ItFunction itFunction)

TMVA::DNN::operator|
ModeOutputValues operator|(ModeOutputValues lhs, ModeOutputValues rhs)
Definition: NeuralNet.h:187

TMVA::DNN::ModeOutput
ModeOutput
Definition: NeuralNet.h:1035

TMVA::DNN::ModeOutput::FETCH
@ FETCH

TMVA::DNN::EnumRegularization
EnumRegularization
Definition: NeuralNet.h:172

TMVA::DNN::EnumRegularization::L1MAX
@ L1MAX

TMVA::DNN::EnumRegularization::L2
@ L2

TMVA::DNN::EnumRegularization::L1
@ L1

TMVA::DNN::EnumRegularization::NONE
@ NONE

TMVA::DNN::crossEntropy
double crossEntropy(ItProbability itProbabilityBegin, ItProbability itProbabilityEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight)
cross entropy error function
Definition: NeuralNet.icc:412

TMVA::DNN::backward
void backward(LAYERDATA &prevLayerData, LAYERDATA &currLayerData)
backward application of the weights (back-propagation of the error)
Definition: NeuralNet.icc:572

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition: NeuralNet.icc:498

TMVA::DNN::operator&=
ModeOutputValues operator&=(ModeOutputValues &lhs, ModeOutputValues rhs)
Definition: NeuralNet.h:203

TMVA::DNN::EnumFunction
EnumFunction
Definition: NeuralNet.h:156

TMVA::DNN::EnumFunction::TANH
@ TANH

TMVA::DNN::EnumFunction::SOFTSIGN
@ SOFTSIGN

TMVA::DNN::EnumFunction::GAUSS
@ GAUSS

TMVA::DNN::EnumFunction::TANHSHIFT
@ TANHSHIFT

TMVA::DNN::EnumFunction::SYMMRELU
@ SYMMRELU

TMVA::DNN::EnumFunction::ZERO
@ ZERO

TMVA::DNN::EnumFunction::LINEAR
@ LINEAR

TMVA::DNN::EnumFunction::SIGMOID
@ SIGMOID

TMVA::DNN::EnumFunction::GAUSSCOMPLEMENT
@ GAUSSCOMPLEMENT

TMVA::DNN::EnumFunction::RELU
@ RELU

TMVA::DNN::regularization
auto regularization(const typename Architecture_t::Matrix_t &A, ERegularization R) -> decltype(Architecture_t::L1Regularization(A))
Evaluate the regularization functional for a given weight matrix.
Definition: Functions.h:238

TMVA::DNN::ModeErrorFunction
ModeErrorFunction
error functions to be chosen from
Definition: NeuralNet.h:1044

TMVA::DNN::ModeErrorFunction::CROSSENTROPY
@ CROSSENTROPY

TMVA::DNN::ModeErrorFunction::SUMOFSQUARES
@ SUMOFSQUARES

TMVA::DNN::ModeErrorFunction::CROSSENTROPY_MUTUALEXCLUSIVE
@ CROSSENTROPY_MUTUALEXCLUSIVE

TMVA::DNN::softMaxCrossEntropy
double softMaxCrossEntropy(ItOutput itProbabilityBegin, ItOutput itProbabilityEnd, ItTruth itTruthBegin, ItTruth itTruthEnd, ItDelta itDelta, ItDelta itDeltaEnd, ItInvActFnc itInvActFnc, double patternWeight)
soft-max-cross-entropy error function (for mutually exclusive cross-entropy)
Definition: NeuralNet.icc:458

TMVA::DNN::WeightInitializationStrategy
WeightInitializationStrategy
weight initialization strategies to be chosen from
Definition: NeuralNet.h:1055

TMVA::DNN::WeightInitializationStrategy::TEST
@ TEST

TMVA::DNN::WeightInitializationStrategy::XAVIERUNIFORM
@ XAVIERUNIFORM

TMVA::DNN::WeightInitializationStrategy::XAVIER
@ XAVIER

TMVA::DNN::WeightInitializationStrategy::LAYERSIZE
@ LAYERSIZE

TMVA::DNN::operator|=
ModeOutputValues operator|=(ModeOutputValues &lhs, ModeOutputValues rhs)
Definition: NeuralNet.h:192

TMVA::DNN::MinimizerType
MinimizerType
list all the minimizer types
Definition: NeuralNet.h:320

TMVA::DNN::fSteepest
@ fSteepest
SGD.
Definition: NeuralNet.h:321

TMVA::DNN::gaussDouble
double gaussDouble(double mean, double sigma)
Definition: NeuralNet.cxx:35

TMVA::DNN::operator&
ModeOutputValues operator&(ModeOutputValues lhs, ModeOutputValues rhs)
Definition: NeuralNet.h:198

TMVA::DNN::ModeOutputValues
ModeOutputValues
Definition: NeuralNet.h:178

TMVA::DNN::ModeOutputValues::SOFTMAX
@ SOFTMAX

TMVA::DNN::ModeOutputValues::BATCHNORMALIZATION
@ BATCHNORMALIZATION

TMVA::DNN::ModeOutputValues::DIRECT
@ DIRECT

TMVA::DNN::applyWeights
void applyWeights(ItSource itSourceBegin, ItSource itSourceEnd, ItWeight itWeight, ItTarget itTargetBegin, ItTarget itTargetEnd)

TMVA::DNN::pass_through_type
std::tuple< Settings &, Batch &, DropContainer & > pass_through_type
Definition: NeuralNet.h:1299

TMVA::DNN::isFlagSet
bool isFlagSet(T flag, T value)
Definition: NeuralNet.h:211

TMVA::DNN::randomInt
int randomInt(int maxValue)
Definition: NeuralNet.cxx:52

TMVA::DNN::update
void update(ItSource itSource, ItSource itSourceEnd, ItDelta itTargetDeltaBegin, ItDelta itTargetDeltaEnd, ItTargetGradient itTargetGradientBegin, ItGradient itGradient)
update the gradients
Definition: NeuralNet.icc:183

TMVA::DNN::DropContainer
std::vector< char > DropContainer
Definition: NeuralNet.h:218

TMVA::DNN::applyWeightsBackwards
void applyWeightsBackwards(ItSource itCurrBegin, ItSource itCurrEnd, ItWeight itWeight, ItPrev itPrevBegin, ItPrev itPrevEnd)

TMVA
create variable transformations
Definition: GeneticMinimizer.h:21

output
static void output(int code)
Definition: gifencode.c:226