doc/v620/Reference_2LossFunctions_8hxx_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Simon Pfreundschuh 10/07/16


/*************************************************************************

 * Copyright (C) 2016, Simon Pfreundschuh                                *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


 ////////////////////////////////////////////////////////////

 // Implementation of the loss functions for the reference //

 // implementation.                                        //

 ////////////////////////////////////////////////////////////


#include "TMVA/DNN/Architectures/Reference.h"

#include <cmath>


namespace TMVA

{

namespace DNN

{

//______________________________________________________________________________

/// Weighted mean squared error between the targets Y and the network output.
///
/// Every squared residual (Y(i,j) - output(i,j))^2 is scaled by the weight of
/// its row, read from column 0 of `weights`, and the total is divided by the
/// number of elements of Y (rows * columns).
///
/// \param Y        Target values; its dimensions drive the iteration.
/// \param output   Network output, indexed with the same (row, column) pairs as Y.
/// \param weights  Per-row weights; only column 0 is read.
/// \return The weighted sum of squared residuals divided by rows * columns.
template <typename AReal>
AReal TReference<AReal>::MeanSquaredError(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                          const TMatrixT<AReal> &weights)
{
   const size_t nRows = Y.GetNrows();
   const size_t nCols = Y.GetNcols();

   AReal loss = 0.0;
   for (size_t row = 0; row < nRows; ++row) {
      for (size_t col = 0; col < nCols; ++col) {
         const AReal residual = Y(row, col) - output(row, col);
         loss += weights(row, 0) * residual * residual;
      }
   }

   return loss / static_cast<AReal>(nRows * nCols);
}


//______________________________________________________________________________

/// Gradient of the weighted mean squared error with respect to the output.
///
/// Writes dY(i,j) = -2 / (rows * columns) * (Y(i,j) - output(i,j)) * weights(i,0),
/// where rows and columns are the dimensions of Y.
///
/// \param dY       Receives the gradient; filled through TMatrixT::Minus and
///                 then rescaled in place.
/// \param Y        Target values.
/// \param output   Network output.
/// \param weights  Per-row weights; only column 0 is read.
template <typename AReal>
void TReference<AReal>::MeanSquaredErrorGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y,
                                                  const TMatrixT<AReal> &output, const TMatrixT<AReal> &weights)
{
   const size_t nRows = Y.GetNrows();
   const size_t nCols = Y.GetNcols();

   // Element-wise difference first, then the constant factor -2 / (rows * columns).
   dY.Minus(Y, output);
   dY *= -2.0 / static_cast<AReal>(nRows * nCols);

   // Finally apply the weight of each row to all of its entries.
   for (size_t row = 0; row < nRows; ++row) {
      for (size_t col = 0; col < nCols; ++col) {
         dY(row, col) *= weights(row, 0);
      }
   }
}


//______________________________________________________________________________

/// Weighted binary cross entropy with an implicit sigmoid.
///
/// `output` holds linear activations x; the sigmoid sig(x) = 1 / (1 + exp(-x))
/// is applied implicitly. For each element the contribution is
///
///    -w_i * [ y * log(sig(x)) + (1 - y) * log(1 - sig(x)) ]
///
/// and the total is divided by rows * columns of Y.
///
/// The logarithms are evaluated in softplus form,
///    -log(sig(x))     = log(1 + exp(-x)) = max(-x, 0) + log1p(exp(-|x|))
///    -log(1 - sig(x)) = log(1 + exp( x)) = max( x, 0) + log1p(exp(-|x|))
/// so that large |x| no longer yields log(0) = -inf (and 0 * -inf = NaN), which
/// happened when the sigmoid was computed explicitly and saturated to 0 or 1.
///
/// \param Y        Target values; its dimensions drive the iteration.
/// \param output   Linear activations (before the sigmoid).
/// \param weights  Per-row weights; only column 0 is read.
/// \return The weighted cross entropy divided by rows * columns.
template <typename AReal>
AReal TReference<AReal>::CrossEntropy(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                      const TMatrixT<AReal> &weights)
{
   const size_t m = Y.GetNrows();
   const size_t n = Y.GetNcols();
   const AReal zero = 0.0;
   AReal result = 0.0;

   for (size_t i = 0; i < m; i++) {
      const AReal w = weights(i, 0);
      for (size_t j = 0; j < n; j++) {
         const AReal x = output(i, j);
         const AReal y = Y(i, j);

         // exp(-|x|) lies in [0, 1], so neither exp nor log1p can overflow.
         const AReal tail = std::log1p(std::exp(-std::fabs(x)));
         const AReal negLogSig = (x < zero ? -x : zero) + tail;        // -log(sig(x))
         const AReal negLogOneMinusSig = (x > zero ? x : zero) + tail; // -log(1 - sig(x))

         result += w * (y * negLogSig + (1.0 - y) * negLogOneMinusSig);
      }
   }

   // The sign is already folded into the accumulated terms.
   result /= static_cast<AReal>(m * n);
   return result;
}


//______________________________________________________________________________

/// Gradient of the weighted sigmoid cross entropy with respect to the linear
/// activations in `output`.
///
/// Writes dY(i,j) = weights(i,0) * (sig(output(i,j)) - Y(i,j)) / (rows * columns),
/// with sig(x) = 1 / (1 + exp(-x)) and rows/columns taken from Y.
///
/// \param dY       Receives the gradient; every (i,j) within Y's dimensions is assigned.
/// \param Y        Target values.
/// \param output   Linear activations (before the sigmoid).
/// \param weights  Per-row weights; only column 0 is read.
template <typename AReal>
void TReference<AReal>::CrossEntropyGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y,
                                              const TMatrixT<AReal> &output, const TMatrixT<AReal> &weights)
{
   const size_t nRows = Y.GetNrows();
   const size_t nCols = Y.GetNcols();
   const AReal scale = 1.0 / static_cast<AReal>(nRows * nCols);

   for (size_t row = 0; row < nRows; ++row) {
      const AReal rowWeight = weights(row, 0);
      for (size_t col = 0; col < nCols; ++col) {
         const AReal target  = Y(row, col);
         const AReal sigmoid = 1.0 / (1.0 + std::exp(-output(row, col)));
         dY(row, col) = scale * rowWeight * (sigmoid - target);
      }
   }
}


//______________________________________________________________________________

/// Weighted cross entropy with an implicit softmax over each row.
///
/// `output` holds linear activations; for every row i the contribution is
///
///    -w_i * sum_j Y(i,j) * log( exp(output(i,j)) / sum_k exp(output(i,k)) )
///
/// and the total is divided by the number of rows of Y.
///
/// The log-softmax is evaluated as
///    output(i,j) - ( max_i + log( sum_k exp(output(i,k) - max_i) ) )
/// where max_i is the largest activation in the row. Subtracting the row
/// maximum keeps every exponent <= 0, so exp() cannot overflow to inf (which
/// previously produced log(inf / inf) = NaN) and the largest term is exactly 1,
/// so the sum cannot underflow to 0.
///
/// \param Y        Target values; its dimensions drive the iteration.
/// \param output   Linear activations (before the softmax).
/// \param weights  Per-row weights; only column 0 is read.
/// \return The weighted cross entropy divided by the number of rows.
template <typename AReal>
AReal TReference<AReal>::SoftmaxCrossEntropy(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                             const TMatrixT<AReal> &weights)
{
   const size_t m = Y.GetNrows();
   const size_t n = Y.GetNcols();
   AReal result = 0.0;

   for (size_t i = 0; i < m; i++) {
      const AReal w = weights(i, 0);

      // Largest activation of the row, used to shift the exponents.
      AReal rowMax = 0.0;
      for (size_t j = 0; j < n; j++) {
         if (j == 0 || output(i, j) > rowMax) {
            rowMax = output(i, j);
         }
      }

      AReal sum = 0.0;
      for (size_t j = 0; j < n; j++) {
         sum += std::exp(output(i, j) - rowMax);
      }

      // log( sum_k exp(output(i,k)) ) without ever forming the large exponentials.
      const AReal logSumExp = rowMax + std::log(sum);
      for (size_t j = 0; j < n; j++) {
         result += w * Y(i, j) * (output(i, j) - logSumExp);
      }
   }

   result /= -static_cast<AReal>(m);
   return result;
}


//______________________________________________________________________________

/// Gradient of the weighted softmax cross entropy with respect to the linear
/// activations in `output`.
///
/// For every row i, with softmax_j = exp(output(i,j)) / sum_k exp(output(i,k))
/// and sumY_i = sum_k Y(i,k), writes
///
///    dY(i,j) = weights(i,0) / rows * ( softmax_j * sumY_i - Y(i,j) )
///
/// The softmax is evaluated with the row maximum subtracted from every
/// activation. This leaves the ratio unchanged but keeps all exponents <= 0,
/// so exp() cannot overflow to inf and produce inf / inf = NaN gradients.
///
/// \param dY       Receives the gradient; every (i,j) within Y's dimensions is assigned.
/// \param Y        Target values.
/// \param output   Linear activations (before the softmax).
/// \param weights  Per-row weights; only column 0 is read.
template <typename AReal>
void TReference<AReal>::SoftmaxCrossEntropyGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y,
                                                     const TMatrixT<AReal> &output, const TMatrixT<AReal> &weights)
{
   const size_t m = Y.GetNrows();
   const size_t n = Y.GetNcols();
   const AReal norm = 1.0 / static_cast<AReal>(m);

   for (size_t i = 0; i < m; i++) {
      const AReal w = weights(i, 0);

      // Largest activation of the row, used to shift the exponents.
      AReal rowMax = 0.0;
      for (size_t j = 0; j < n; j++) {
         if (j == 0 || output(i, j) > rowMax) {
            rowMax = output(i, j);
         }
      }

      AReal sum  = 0.0;
      AReal sumY = 0.0;
      for (size_t j = 0; j < n; j++) {
         sum  += std::exp(output(i, j) - rowMax);
         sumY += Y(i, j);
      }

      for (size_t j = 0; j < n; j++) {
         dY(i, j) = w * norm * (std::exp(output(i, j) - rowMax) / sum * sumY - Y(i, j));
      }
   }
}


} // namespace DNN

} // namespace TMVA

Reference.h

exp
double exp(double)

log
double log(double)

TMVA::DNN::TReference::CrossEntropyGradients
static void CrossEntropyGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.hxx:85

TMVA::DNN::TReference::SoftmaxCrossEntropy
static AReal SoftmaxCrossEntropy(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Softmax transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition: LossFunctions.hxx:107

TMVA::DNN::TReference::CrossEntropy
static AReal CrossEntropy(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Sigmoid transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition: LossFunctions.hxx:64

TMVA::DNN::TReference::MeanSquaredErrorGradients
static void MeanSquaredErrorGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.hxx:45

TMVA::DNN::TReference::SoftmaxCrossEntropyGradients
static void SoftmaxCrossEntropyGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.hxx:131

TMVA::DNN::TReference::MeanSquaredError
static AReal MeanSquaredError(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.hxx:25

TMatrixTBase::GetNrows
Int_t GetNrows() const
Definition: TMatrixTBase.h:124

TMatrixTBase::GetNcols
Int_t GetNcols() const
Definition: TMatrixTBase.h:127

TMatrixT< AReal >

TMatrixT::Minus
void Minus(const TMatrixT< Element > &a, const TMatrixT< Element > &b)
General matrix summation. Create a matrix C such that C = A - B.
Definition: TMatrixT.cxx:580

y
Double_t y[n]
Definition: legend1.C:17

n
const Int_t n
Definition: legend1.C:16

TMVA
create variable transformations
Definition: GeneticMinimizer.h:21

m
auto * m
Definition: textangle.C:8

sum
static long int sum(long int i)
Definition: Factory.cxx:2276

output
static void output(int code)
Definition: gifencode.c:226