doc/master/LossFunction_8cxx_source.html

// @(#)root/tmva $Id$

// Author: Andreas Hoecker, Peter Speckmayer, Joerg Stelzer, Helge Voss, Jan Therhaag


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : LossFunction                                                          *

 *                                             *

 *                                                                                *

 * Description:                                                                   *

 *      Implementation (see header for description)                               *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Andreas Hoecker <Andreas.Hocker@cern.ch> - CERN, Switzerland              *

 *      Peter Speckmayer <Peter.Speckmayer@cern.ch> - CERN, Switzerland           *

 *      Joerg Stelzer   <Joerg.Stelzer@cern.ch>  - CERN, Switzerland              *

 *      Jan Therhaag       <Jan.Therhaag@cern.ch>     - U of Bonn, Germany        *

 *      Helge Voss      <Helge.Voss@cern.ch>     - MPI-K Heidelberg, Germany      *

 *                                                                                *

 * Copyright (c) 2005-2011:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (http://mva.sourceforge.net/license.txt)                                       *

 **********************************************************************************/


/*! \class TMVA::HuberLossFunction

\ingroup TMVA


Huber Loss Function.


*/


#include "TMVA/LossFunction.h"
#include "TMVA/Config.h"

#include "TMVA/MsgLogger.h"

#include "Rtypes.h"
#include "TMath.h"

#include <algorithm>
#include <cmath>
#include <iostream>
#include <map>
#include <numeric>
#include <vector>

// multithreading only if the compilation flag is turned on
#ifdef R__USE_IMT
#include <ROOT/TThreadExecutor.hxx>
#include "ROOT/TSeq.hxx"
#endif


////////////////////////////////////////////////////////////////////////////////

/// huber constructor


// Default constructor: selects the default quantile and marks the derived
// quantities as "not computed yet".
TMVA::HuberLossFunction::HuberLossFunction()
{
   // The quantile value determines the bulk of the data, e.g. 0.7 defines
   // the core as the first 70% and the tails as the last 30%.
   fQuantile = 0.7;

   // -9999 is the "uninitialized" marker; CalculateLoss compares
   // fSumOfWeights against it to decide whether it must initialize itself.
   fSumOfWeights = -9999;
   fTransitionPoint = -9999;
}


// Constructor with a caller-chosen quantile.
// quantile: stored as fQuantile; it is passed to CalculateQuantile by
//           SetTransitionPoint to locate the core/tail transition residual.
TMVA::HuberLossFunction::HuberLossFunction(Double_t quantile)
{
   fQuantile = quantile;

   // -9999 is the "uninitialized" marker for the derived quantities.
   fTransitionPoint = -9999;
   fSumOfWeights = -9999;
}


////////////////////////////////////////////////////////////////////////////////

/// huber destructor


// The destructor body is intentionally empty.
TMVA::HuberLossFunction::~HuberLossFunction() {}


////////////////////////////////////////////////////////////////////////////////

/// figure out the residual that determines the separation between the

/// "core" and the "tails" of the residuals distribution


// Compute and store fSumOfWeights and fTransitionPoint for the given events.
// evs: events to initialize from; note that the vector is re-ordered, because
//      SetTransitionPoint delegates to CalculateQuantile, which sorts it.
void TMVA::HuberLossFunction::Init(std::vector<LossFunctionEventInfo> &evs)
{
   // The order matters: SetTransitionPoint reads the fSumOfWeights value
   // that SetSumOfWeights has just stored.
   SetSumOfWeights(evs);
   SetTransitionPoint(evs);
}


////////////////////////////////////////////////////////////////////////////////

/// huber, calculate the sum of weights for the events in the vector


// Multithreaded version of HuberLossFunction::CalculateSumOfWeights

#ifdef R__USE_IMT

// Sum the weights of all events using the TMVA thread executor.
// evs: events whose weights are summed (not modified).
// Returns the value produced by Executor::MapReduce for the map/reduce pair below.
Double_t TMVA::HuberLossFunction::CalculateSumOfWeights(const std::vector<LossFunctionEventInfo> &evs)
{
   auto &executor = TMVA::Config::Instance().GetThreadExecutor();

   // map step: index -> weight of that event
   auto weightAt = [&evs](UInt_t idx) { return evs[idx].weight; };

   // reduce step: add up a batch of mapped weights
   auto addUp = [](const std::vector<Double_t> &values) {
      return std::accumulate(values.begin(), values.end(), 0.0);
   };

   return executor.MapReduce(weightAt, ROOT::TSeqU(evs.size()), addUp, executor.GetPoolSize());
}


// Standard version of HuberLossFunction::CalculateSumOfWeights

#else

// Sum the weights of all events (single-threaded variant).
// evs: events whose weights are summed (not modified).
// Returns 0 for an empty vector.
Double_t TMVA::HuberLossFunction::CalculateSumOfWeights(const std::vector<LossFunctionEventInfo> &evs)
{
   Double_t total = 0;
   for (const auto &ev : evs)
      total += ev.weight;
   return total;
}

#endif


////////////////////////////////////////////////////////////////////////////////

/// huber, determine the quantile for a given input


// Determine the weighted quantile of the residuals (trueValue - predictedValue).
// evs:           events to inspect; the vector is sorted in place.
// whichQuantile: fraction of sumOfWeights at which the running weight sum stops.
// sumOfWeights:  total weight the fraction refers to.
// abs:           if true, sort by and return the residual magnitude;
//                otherwise sort by and return the signed residual.
// Returns the residual of the selected event, or 0 when evs is empty.
Double_t TMVA::HuberLossFunction::CalculateQuantile(std::vector<LossFunctionEventInfo>& evs, Double_t whichQuantile, Double_t sumOfWeights, bool abs){

   // Without events there is no residual to report. This guard also keeps
   // the unsigned expression evs.size()-1 below from wrapping around, which
   // would otherwise end in a read of evs[0] on an empty vector.
   if (evs.empty()) return 0.;

   // The quantity the events are ordered by (and that is finally returned).
   auto residualOf = [abs](const LossFunctionEventInfo &ev) {
      const Double_t r = ev.trueValue - ev.predictedValue;
      return abs ? TMath::Abs(r) : r;
   };

   // Sort in ascending order of that quantity; the comparator takes its
   // arguments by const reference so no event is copied per comparison.
   std::sort(evs.begin(), evs.end(),
             [&residualOf](const LossFunctionEventInfo &a, const LossFunctionEventInfo &b) {
                return residualOf(a) < residualOf(b);
             });

   // Walk the sorted events, accumulating weight until the running sum
   // exceeds the requested fraction or the last event is reached.
   // NOTE(review): i is advanced after each weight is added, so on exit it
   // refers to the event following the one that crossed the threshold
   // (clamped to the last event) - confirm this convention is intended.
   const Double_t threshold = sumOfWeights*whichQuantile;
   const auto lastIndex = evs.size()-1;
   UInt_t i = 0;
   Double_t runningWeight = 0.0;
   while(i<lastIndex && runningWeight <= threshold){
      runningWeight += evs[i].weight;
      i++;
   }

   // edge case: take the 0th quantile to mean the 0th entry in the ordered series
   if(whichQuantile == 0) i=0;

   return residualOf(evs[i]);
}


////////////////////////////////////////////////////////////////////////////////

/// huber, determine the transition point using the values for fQuantile and fSumOfWeights

/// which presumably have already been set


void TMVA::HuberLossFunction::SetTransitionPoint(std::vector<LossFunctionEventInfo>& evs){

   fTransitionPoint = CalculateQuantile(evs, fQuantile, fSumOfWeights, true);


   // if the transition point corresponding to the quantile is 0 then the loss function will not function

   // the quantile was chosen too low. Let's use the first nonzero residual as the transition point instead.

   if(fTransitionPoint == 0){

      // evs should already be sorted according to the magnitude of the residuals, since CalculateQuantile does this

      for(UInt_t i=0; i<evs.size(); i++){

         Double_t residual = TMath::Abs(evs[i].trueValue - evs[i].predictedValue);

         if(residual != 0){

            fTransitionPoint = residual;

            break;

         }

      }

   }


   // Let the user know that the transition point is zero and the loss function won't work properly

   if(fTransitionPoint == 0){

      //std::cout << "The residual transition point for the Huber loss function corresponding to quantile, " << fQuantile << ", is zero."

      //<< " This implies that all of the residuals are zero and the events have been predicted perfectly. Perhaps the regression is too complex"

      //<< " for the amount of data." << std::endl;

   }

}


////////////////////////////////////////////////////////////////////////////////

/// huber, set the sum of weights given a collection of events


void TMVA::HuberLossFunction::SetSumOfWeights(std::vector<LossFunctionEventInfo>& evs){

   fSumOfWeights = CalculateSumOfWeights(evs);

}


////////////////////////////////////////////////////////////////////////////////

/// huber,  determine the loss for a single event


// Weighted Huber loss of a single event.
// e: the event; its trueValue, predictedValue and weight are read.
// Returns weight * L(r), with r = |trueValue - predictedValue|, d = fTransitionPoint:
//    L(r) = 0.5*r*r            for r <= d   (quadratic core)
//    L(r) = d*r - 0.5*d*d      for r >  d   (linear tails)
Double_t TMVA::HuberLossFunction::CalculateLoss(LossFunctionEventInfo& e){
   // If the huber loss function is uninitialized then assume a group of one
   // and initialize the transition point and weights for this single event
   if(fSumOfWeights == -9999){
      std::vector<LossFunctionEventInfo> evs{e};
      SetSumOfWeights(evs);
      SetTransitionPoint(evs);
   }

   const Double_t residual = TMath::Abs(e.trueValue - e.predictedValue);
   Double_t loss = 0;

   // Quadratic loss in terms of the residual for small residuals
   if(residual <= fTransitionPoint) loss = 0.5*residual*residual;
   // Linear loss for large residuals, so that the tails don't dominate the
   // net loss calculation. The slope has to be the transition residual
   // (fTransitionPoint), not the quantile fraction (fQuantile): only then
   // do the two branches agree at residual == fTransitionPoint.
   else loss = fTransitionPoint*residual - 0.5*fTransitionPoint*fTransitionPoint;

   return e.weight*loss;
}


////////////////////////////////////////////////////////////////////////////////

/// huber, determine the net loss for a collection of events


// Sum of the per-event Huber losses over a collection of events.
// evs: events to evaluate; sorted in place as a side effect of SetTransitionPoint.
// Returns the sum of CalculateLoss over all events.
Double_t TMVA::HuberLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo> &evs)
{
   // The loss of each event depends on the other events in the group, which
   // define the cutoff residual (fTransitionPoint), so refresh the state first.
   SetSumOfWeights(evs);
   SetTransitionPoint(evs);

   Double_t total = 0;
   for (auto &ev : evs)
      total += CalculateLoss(ev);
   return total;
}


////////////////////////////////////////////////////////////////////////////////

/// huber, determine the mean loss for a collection of events


// Weighted mean Huber loss over a collection of events.
// evs: events to evaluate; sorted in place as a side effect of SetTransitionPoint.
// Returns the summed per-event loss divided by fSumOfWeights.
Double_t TMVA::HuberLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo> &evs)
{
   // The loss of each event depends on the other events in the group, which
   // define the cutoff residual (fTransitionPoint), so refresh the state first.
   SetSumOfWeights(evs);
   SetTransitionPoint(evs);

   Double_t total = 0;
   for (auto &ev : evs)
      total += CalculateLoss(ev);

   return total/fSumOfWeights;
}


/*! \class TMVA::HuberLossFunctionBDT

\ingroup TMVA


Huber BDT Loss Function.


*/


// Default constructor; the body is intentionally empty.
TMVA::HuberLossFunctionBDT::HuberLossFunctionBDT() {}


////////////////////////////////////////////////////////////////////////////////

/// huber BDT, initialize the targets and prepare for the regression


// Run this once before building the forest: the initial prediction is set to
// the weighted median of the residuals.
// evinfomap:    per-event info; weightedMedian is added to every predictedValue.
// boostWeights: the weighted median is appended as the first boost weight.
void TMVA::HuberLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

   // Collect one entry per event. The vector is only reserved, not sized:
   // constructing it with evinfomap.size() elements and then calling
   // push_back would leave that many default-constructed entries in front
   // of the real ones, and they would take part in the quantile below.
   std::vector<LossFunctionEventInfo> evinfovec;
   evinfovec.reserve(evinfomap.size());
   for (auto &e: evinfomap){
      evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));
   }

   // Store fSumOfWeights for the current events and take the 0.5 quantile
   // of the signed residuals as the weighted median
   SetSumOfWeights(evinfovec);
   Double_t weightedMedian = CalculateQuantile(evinfovec, 0.5, fSumOfWeights, false);

   // Store the weighted median as a first boost weight for later use
   boostWeights.push_back(weightedMedian);
   for (auto &e: evinfomap ) {
      // shift the initial prediction of every event by the median
      e.second.predictedValue += weightedMedian;
   }
}


////////////////////////////////////////////////////////////////////////////////

/// huber BDT, set the targets for a collection of events


// Multithreaded version of HuberLossFunctionBDT::SetTargets

#ifdef R__USE_IMT

// Recompute the transition point for the given events and then set target 0
// of every event to its Huber target, using the TMVA thread executor.
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::HuberLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

   auto &executor = TMVA::Config::Instance().GetThreadExecutor();

   // SetSumOfWeights and SetTransitionPoint require a vector of
   // LossFunctionEventInfo, so copy the events into one, slot by slot.
   // NOTE(review): evinfomap[...] inserts when the key is absent; presumably
   // every event in evs is already present in the map - confirm, since the
   // lookups below are issued through the thread executor.
   std::vector<LossFunctionEventInfo> eventvec(evs.size());
   auto copyEvent = [&eventvec, &evs, &evinfomap](UInt_t idx) {
      const LossFunctionEventInfo &info = evinfomap[evs[idx]];
      eventvec[idx] = LossFunctionEventInfo(info.trueValue, info.predictedValue, evs[idx]->GetWeight());
   };
   executor.Foreach(copyEvent, ROOT::TSeqU(evs.size()), executor.GetPoolSize());

   // Recalculate the residual that separates the "core" of the data and the
   // "tails". This residual is the quantile given by fQuantile, defaulted to
   // 0.7; the quantile corresponding to 0.5 would be the usual median.
   SetSumOfWeights(eventvec); // already set in Init, but may change if there is subsampling for each tree
   SetTransitionPoint(eventvec);

   // now set the targets
   auto assignTarget = [this, &evinfomap](const TMVA::Event *ev) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   };
   executor.Foreach(assignTarget, evs, executor.GetPoolSize());
}


// Standard version of HuberLossFunctionBDT::SetTargets

#else

// Recompute the transition point for the given events and then set target 0
// of every event to its Huber target (single-threaded variant).
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::HuberLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

   // Collect one entry per event. The vector is only reserved, not sized:
   // constructing it with evs.size() elements and then calling push_back
   // would leave that many default-constructed entries in front of the real
   // ones, and they would take part in the transition point calculation.
   std::vector<LossFunctionEventInfo> eventvec;
   eventvec.reserve(evs.size());
   for (const TMVA::Event *ev : evs) {
      const LossFunctionEventInfo &info = evinfomap[ev];
      eventvec.push_back(LossFunctionEventInfo(info.trueValue, info.predictedValue, ev->GetWeight()));
   }

   // Recalculate the residual that separates the "core" of the data and the
   // "tails". This residual is the quantile given by fQuantile, defaulted to
   // 0.7; the quantile corresponding to 0.5 would be the usual median.
   SetSumOfWeights(eventvec); // already set in Init, but may change if there is subsampling for each tree
   SetTransitionPoint(eventvec);

   for (const TMVA::Event *ev : evs) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   }
}

#endif


////////////////////////////////////////////////////////////////////////////////

/// huber BDT, set the target for a single event


// Huber target of a single event: the residual itself inside the core, and
// the residual clipped to +/- fTransitionPoint in the tails.
// e: the event; only trueValue and predictedValue are read.
Double_t TMVA::HuberLossFunctionBDT::Target(LossFunctionEventInfo &e)
{
   // The weight/target relationships are taken care of in the tmva decision
   // tree operations, so the weight does not enter here.
   const Double_t residual = e.trueValue - e.predictedValue;

   if (TMath::Abs(residual) <= fTransitionPoint)
      return residual;

   const Double_t sign = (residual < 0) ? -1.0 : 1.0;
   return fTransitionPoint*sign;
}


////////////////////////////////////////////////////////////////////////////////

/// huber BDT, determine the fit value for the terminal node based upon the

/// events in the terminal node


// Fit value for a terminal node: the median of the residuals plus the average
// clipped difference from that median. Differences larger in magnitude than
// fTransitionPoint are replaced by +/- fTransitionPoint, so the tails are
// discounted and the result lies between least squares (mean as fit) and
// absolute deviation (median as fit).
// evs: events in the terminal node; sorted in place by CalculateQuantile.
Double_t TMVA::HuberLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo> &evs)
{
   const Double_t sumOfWeights = CalculateSumOfWeights(evs);
   const Double_t residualMedian = CalculateQuantile(evs, 0.5, sumOfWeights, false);

   Double_t shift = 0;
   for (const auto &ev : evs) {
      const Double_t diff = (ev.trueValue - ev.predictedValue) - residualMedian;
      const Double_t sign = (diff < 0) ? -1.0 : 1.0;

      // NOTE(review): every event contributes with 1/evs.size() here, even
      // when event weights are in use. The original author suspected this
      // should instead be
      //    shift += ev.weight/sumOfWeights * sign * TMath::Min(fTransitionPoint, |diff|);
      // but left the unweighted form in place - confirm before changing.
      shift += 1.0/evs.size()*sign*TMath::Min(fTransitionPoint, TMath::Abs(diff));
   }

   return (residualMedian + shift);
}


/*! \class TMVA::LeastSquaresLossFunction

\ingroup TMVA


Least Squares Loss Function.


*/


// Constructor and destructor are in header file. They don't do anything.


////////////////////////////////////////////////////////////////////////////////

/// least squares ,  determine the loss for a single event


// Weighted squared residual of a single event.
// e: the event; trueValue, predictedValue and weight are read.
// Returns weight * (trueValue - predictedValue)^2.
Double_t TMVA::LeastSquaresLossFunction::CalculateLoss(LossFunctionEventInfo &e)
{
   const Double_t residual = e.trueValue - e.predictedValue;
   const Double_t squared = residual*residual;
   return e.weight*squared;
}


////////////////////////////////////////////////////////////////////////////////

/// least squares , determine the net loss for a collection of events


// Sum of the per-event least squares losses over a collection of events.
// evs: events to evaluate.
// Returns the sum of CalculateLoss over all events (0 for an empty vector).
Double_t TMVA::LeastSquaresLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo> &evs)
{
   Double_t total = 0;
   for (auto &ev : evs)
      total += CalculateLoss(ev);
   return total;
}


////////////////////////////////////////////////////////////////////////////////

/// least squares , determine the mean loss for a collection of events


// Weighted mean least squares loss over a collection of events.
// evs: events to evaluate.
// Returns the summed per-event loss divided by the summed event weights.
Double_t TMVA::LeastSquaresLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo> &evs)
{
   Double_t weightTotal = 0;
   Double_t lossTotal = 0;
   for (auto &ev : evs) {
      weightTotal += ev.weight;
      lossTotal += CalculateLoss(ev);
   }

   // the weighted mean
   return lossTotal/weightTotal;
}


/*! \class TMVA::LeastSquaresLossFunctionBDT

\ingroup TMVA


Least Squares BDT Loss Function.


*/


// Constructor and destructor defined in header. They don't do anything.


////////////////////////////////////////////////////////////////////////////////

/// least squares BDT, initialize the targets and prepare for the regression


// Run this once before building the forest: the initial prediction is set to
// the weighted mean of the residuals.
// evinfomap:    per-event info; weightedMean is added to every predictedValue.
// boostWeights: the weighted mean is appended as the first boost weight.
void TMVA::LeastSquaresLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

   // Collect one entry per event. The vector is only reserved, not sized:
   // constructing it with evinfomap.size() elements and then calling
   // push_back would double its length with default-constructed entries.
   std::vector<LossFunctionEventInfo> evinfovec;
   evinfovec.reserve(evinfomap.size());
   for (auto &e: evinfomap){
      evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));
   }

   // Initial prediction for least squares is the weighted mean
   Double_t weightedMean = Fit(evinfovec);

   // Store the weighted mean as a first boost weight for later use
   boostWeights.push_back(weightedMean);
   for (auto &e: evinfomap ) {
      // shift the initial prediction of every event by the mean
      e.second.predictedValue += weightedMean;
   }
}


////////////////////////////////////////////////////////////////////////////////

/// least squares BDT, set the targets for a collection of events


// Multithreaded version of LeastSquaresLossFunctionBDT::SetTargets

#ifdef R__USE_IMT

// Set target 0 of every event to its least squares target, using the TMVA
// thread executor.
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::LeastSquaresLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap) {

   // work item handed to the executor: one call per event
   auto assignTarget = [this, &evinfomap](const TMVA::Event *ev) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   };

   auto &executor = TMVA::Config::Instance().GetThreadExecutor();
   executor.Foreach(assignTarget, evs, executor.GetPoolSize());
}

// Standard version of LeastSquaresLossFunctionBDT::SetTargets

#else

// Set target 0 of every event to its least squares target (single-threaded
// variant).
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::LeastSquaresLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

   for (const TMVA::Event *ev : evs) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   }
}

#endif


////////////////////////////////////////////////////////////////////////////////

/// least squares BDT, set the target for a single event


// Least squares target of a single event: the plain residual.
// e: the event; only trueValue and predictedValue are read.
Double_t TMVA::LeastSquaresLossFunctionBDT::Target(LossFunctionEventInfo &e)
{
   // The weight/target relationships are taken care of in the tmva decision
   // tree operations, so the residual is returned instead of weight*residual.
   return e.trueValue - e.predictedValue;
}


////////////////////////////////////////////////////////////////////////////////

/// least squares BDT, determine the fit value for the terminal node based upon the

/// events in the terminal node


// Fit value for a terminal node: the weighted average of the residuals.
// evs: events in the terminal node (read only here).
// Returns sum(weight*residual) / sum(weight).
Double_t TMVA::LeastSquaresLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo> &evs)
{
   Double_t weightTotal = 0;
   Double_t weightedResiduals = 0;
   for (const auto &ev : evs) {
      weightTotal += ev.weight;
      const Double_t residual = ev.trueValue - ev.predictedValue;
      weightedResiduals += ev.weight*residual;
   }

   // the weighted mean
   return weightedResiduals/weightTotal;
}


/*! \class TMVA::AbsoluteDeviationLossFunction

\ingroup TMVA


Absolute Deviation Loss Function.


*/


// Constructors in the header. They don't do anything.


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation,  determine the loss for a single event


// Weighted absolute residual of a single event.
// e: the event; trueValue, predictedValue and weight are read.
// Returns weight * |trueValue - predictedValue|.
Double_t TMVA::AbsoluteDeviationLossFunction::CalculateLoss(LossFunctionEventInfo &e)
{
   const Double_t magnitude = TMath::Abs(e.trueValue - e.predictedValue);
   return e.weight*magnitude;
}


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation, determine the net loss for a collection of events


// Sum of the per-event absolute deviation losses over a collection of events.
// evs: events to evaluate.
// Returns the sum of CalculateLoss over all events (0 for an empty vector).
Double_t TMVA::AbsoluteDeviationLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo> &evs)
{
   Double_t total = 0;
   for (auto &ev : evs)
      total += CalculateLoss(ev);
   return total;
}


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation, determine the mean loss for a collection of events


// Weighted mean absolute deviation loss over a collection of events.
// evs: events to evaluate.
// Returns the summed per-event loss divided by the summed event weights.
Double_t TMVA::AbsoluteDeviationLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo> &evs)
{
   Double_t weightTotal = 0;
   Double_t lossTotal = 0;
   for (auto &ev : evs) {
      weightTotal += ev.weight;
      lossTotal += CalculateLoss(ev);
   }
   return lossTotal/weightTotal;
}


/*! \class TMVA::AbsoluteDeviationLossFunctionBDT

\ingroup TMVA


Absolute Deviation BDT Loss Function.


*/


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation BDT, initialize the targets and prepare for the regression


// Run this once before building the forest: the initial prediction is set to
// the value Fit returns for all events (the weighted residual median).
// evinfomap:    per-event info; weightedMedian is added to every predictedValue.
// boostWeights: the weighted median is appended as the first boost weight.
void TMVA::AbsoluteDeviationLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

   // Collect one entry per event. The vector is only reserved, not sized:
   // constructing it with evinfomap.size() elements and then calling
   // push_back would leave that many default-constructed entries in front
   // of the real ones, and Fit could then select one of them as the median.
   std::vector<LossFunctionEventInfo> evinfovec;
   evinfovec.reserve(evinfomap.size());
   for (auto &e: evinfomap){
      evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));
   }

   Double_t weightedMedian = Fit(evinfovec);

   // Store the weighted median as a first boost weight for later use
   boostWeights.push_back(weightedMedian);
   for (auto &e: evinfomap ) {
      // shift the initial prediction of every event by the median
      e.second.predictedValue += weightedMedian;
   }
}


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation BDT, set the targets for a collection of events


// Multithreaded version of AbsoluteDeviationLossFunctionBDT::SetTargets

#ifdef R__USE_IMT

// Set target 0 of every event to its absolute deviation target, using the
// TMVA thread executor.
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::AbsoluteDeviationLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

   // work item handed to the executor: one call per event
   auto assignTarget = [this, &evinfomap](const TMVA::Event *ev) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   };

   auto &executor = TMVA::Config::Instance().GetThreadExecutor();
   executor.Foreach(assignTarget, evs, executor.GetPoolSize());
}

// Standard version of AbsoluteDeviationLossFunctionBDT::SetTargets

#else

// Set target 0 of every event to its absolute deviation target
// (single-threaded variant).
// evs:       events whose target is overwritten (through a const_cast).
// evinfomap: per-event true/predicted values, looked up by event pointer.
void TMVA::AbsoluteDeviationLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

   for (const TMVA::Event *ev : evs) {
      const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));
   }
}

#endif


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation BDT, set the target for a single event


// Absolute deviation target of a single event: the sign of the residual.
// e: the event; only trueValue and predictedValue are read.
// Returns -1.0 for a negative residual and 1.0 otherwise (a zero residual
// therefore yields 1.0).
Double_t TMVA::AbsoluteDeviationLossFunctionBDT::Target(LossFunctionEventInfo &e)
{
   // The weight/target relationships are taken care of in the tmva decision
   // tree operations, so the weight does not enter here.
   const Double_t residual = e.trueValue - e.predictedValue;
   if (residual < 0)
      return -1.0;
   return 1.0;
}


////////////////////////////////////////////////////////////////////////////////

/// absolute deviation BDT, determine the fit value for the terminal node based upon the

/// events in the terminal node


// Fit value for a terminal node: the weighted median of the residuals.
// evs: events in the terminal node; sorted in place by signed residual.
// Returns the residual of the selected event, or 0 when the scan below runs
// past the last event (which includes the empty-vector case).
Double_t TMVA::AbsoluteDeviationLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo> &evs)
{
   // order the events by ascending residual value
   std::sort(evs.begin(), evs.end(),
             [](const LossFunctionEventInfo &lhs, const LossFunctionEventInfo &rhs) {
                return (lhs.trueValue-lhs.predictedValue) < (rhs.trueValue-rhs.predictedValue);
             });

   // total weight, needed to locate the weighted median
   Double_t sumOfWeights = 0;
   for (const auto &ev : evs)
      sumOfWeights += ev.weight;

   // Advance through the sorted events until the running weight exceeds half
   // of the total. The index is incremented after each weight is added, so
   // it ends up one past the event that crossed the halfway mark.
   const Double_t halfWeight = sumOfWeights*0.5;
   UInt_t idx = 0;
   Double_t running = 0.0;
   for (; idx < evs.size() && running <= halfWeight; ++idx)
      running += evs[idx].weight;

   // Prevent uncontrolled memory access in the return value calculation.
   // NOTE(review): this returns 0 rather than the last residual whenever the
   // scan reaches the end (e.g. for a single event) - confirm that is intended.
   if (idx >= evs.size()) return 0.;

   // the median residual
   return evs[idx].trueValue-evs[idx].predictedValue;
}

LossFunction.h

MsgLogger.h

b
#define b(i)
Definition RSha256.hxx:100

f
#define f(i)
Definition RSha256.hxx:104

a
#define a(i)
Definition RSha256.hxx:99

e
#define e(i)
Definition RSha256.hxx:103

UInt_t
unsigned int UInt_t
Definition RtypesCore.h:46

Double_t
double Double_t
Definition RtypesCore.h:59

Rtypes.h

TMath.h

TSeq.hxx

TThreadExecutor.hxx

ROOT::TSeq
A pseudo container class which is a generator of indices.
Definition TSeq.hxx:67

TMVA::AbsoluteDeviationLossFunctionBDT::Fit
Double_t Fit(std::vector< LossFunctionEventInfo > &evs)
absolute deviation BDT, determine the fit value for the terminal node based upon the events in the te...
Definition LossFunction.cxx:591

TMVA::AbsoluteDeviationLossFunctionBDT::SetTargets
void SetTargets(std::vector< const TMVA::Event * > &evs, std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap)
absolute deviation BDT, set the targets for a collection of events
Definition LossFunction.cxx:559

TMVA::AbsoluteDeviationLossFunctionBDT::Init
void Init(std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap, std::vector< double > &boostWeights)
absolute deviation BDT, initialize the targets and prepare for the regression
Definition LossFunction.cxx:536

TMVA::AbsoluteDeviationLossFunctionBDT::Target
Double_t Target(LossFunctionEventInfo &e)
absolute deviation BDT, set the target for a single event
Definition LossFunction.cxx:580

TMVA::AbsoluteDeviationLossFunction::CalculateNetLoss
Double_t CalculateNetLoss(std::vector< LossFunctionEventInfo > &evs)
absolute deviation, determine the net loss for a collection of events
Definition LossFunction.cxx:505

TMVA::AbsoluteDeviationLossFunction::CalculateMeanLoss
Double_t CalculateMeanLoss(std::vector< LossFunctionEventInfo > &evs)
absolute deviation, determine the mean loss for a collection of events
Definition LossFunction.cxx:516

TMVA::AbsoluteDeviationLossFunction::CalculateLoss
Double_t CalculateLoss(LossFunctionEventInfo &e)
absolute deviation, determine the loss for a single event
Definition LossFunction.cxx:497

TMVA::Config::GetThreadExecutor
Executor & GetThreadExecutor()
Get executor class for multi-thread usage In case when MT is not enabled will return a serial executo...
Definition Config.h:81

TMVA::Config::Instance
static Config & Instance()
static function: returns TMVA instance
Definition Config.cxx:98

TMVA::Event
Definition Event.h:51

TMVA::Event::SetTarget
void SetTarget(UInt_t itgt, Float_t value)
set the target value (dimension itgt) to value
Definition Event.cxx:367

TMVA::Executor::Foreach
void Foreach(Function func, unsigned int nTimes, unsigned nChunks=0)
wrap TExecutor::Foreach
Definition Executor.h:117

TMVA::Executor::MapReduce
auto MapReduce(F func, ROOT::TSeq< INTEGER > args, R redfunc) -> InvokeResult_t< F, INTEGER >
Wrap TExecutor::MapReduce functions.
Definition Executor.h:154

TMVA::Executor::GetPoolSize
unsigned int GetPoolSize() const
Definition Executor.h:106

TMVA::HuberLossFunctionBDT::Target
Double_t Target(LossFunctionEventInfo &e)
huber BDT, set the target for a single event
Definition LossFunction.cxx:323

TMVA::HuberLossFunctionBDT::HuberLossFunctionBDT
HuberLossFunctionBDT()
Definition LossFunction.cxx:240

TMVA::HuberLossFunctionBDT::Fit
Double_t Fit(std::vector< LossFunctionEventInfo > &evs)
huber BDT, determine the fit value for the terminal node based upon the events in the terminal node
Definition LossFunction.cxx:334

TMVA::HuberLossFunctionBDT::Init
void Init(std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap, std::vector< double > &boostWeights)
huber BDT, initialize the targets and prepare for the regression
Definition LossFunction.cxx:246

TMVA::HuberLossFunctionBDT::SetTargets
void SetTargets(std::vector< const TMVA::Event * > &evs, std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap)
huber BDT, set the targets for a collection of events
Definition LossFunction.cxx:271

TMVA::HuberLossFunction::HuberLossFunction
HuberLossFunction()
huber constructor
Definition LossFunction.cxx:56

TMVA::HuberLossFunction::SetSumOfWeights
void SetSumOfWeights(std::vector< LossFunctionEventInfo > &evs)
huber, set the sum of weights given a collection of events
Definition LossFunction.cxx:174

TMVA::HuberLossFunction::SetTransitionPoint
void SetTransitionPoint(std::vector< LossFunctionEventInfo > &evs)
huber, determine the transition point using the values for fQuantile and fSumOfWeights which presumab...
Definition LossFunction.cxx:147

TMVA::HuberLossFunction::CalculateNetLoss
Double_t CalculateNetLoss(std::vector< LossFunctionEventInfo > &evs)
huber, determine the net loss for a collection of events
Definition LossFunction.cxx:202

TMVA::HuberLossFunction::fSumOfWeights
Double_t fSumOfWeights
Definition LossFunction.h:170

TMVA::HuberLossFunction::CalculateLoss
Double_t CalculateLoss(LossFunctionEventInfo &e)
huber, determine the loss for a single event
Definition LossFunction.cxx:181

TMVA::HuberLossFunction::fQuantile
Double_t fQuantile
Definition LossFunction.h:168

TMVA::HuberLossFunction::~HuberLossFunction
~HuberLossFunction()
huber destructor
Definition LossFunction.cxx:72

TMVA::HuberLossFunction::fTransitionPoint
Double_t fTransitionPoint
Definition LossFunction.h:169

TMVA::HuberLossFunction::CalculateSumOfWeights
Double_t CalculateSumOfWeights(const std::vector< LossFunctionEventInfo > &evs)
huber, calculate the sum of weights for the events in the vector
Definition LossFunction.cxx:92

TMVA::HuberLossFunction::CalculateMeanLoss
Double_t CalculateMeanLoss(std::vector< LossFunctionEventInfo > &evs)
huber, determine the mean loss for a collection of events
Definition LossFunction.cxx:220

TMVA::HuberLossFunction::Init
void Init(std::vector< LossFunctionEventInfo > &evs)
figure out the residual that determines the separation between the "core" and the "tails" of the resi...
Definition LossFunction.cxx:80

TMVA::HuberLossFunction::CalculateQuantile
Double_t CalculateQuantile(std::vector< LossFunctionEventInfo > &evs, Double_t whichQuantile, Double_t sumOfWeights, bool abs)
huber, determine the quantile for a given input
Definition LossFunction.cxx:117

TMVA::LeastSquaresLossFunctionBDT::SetTargets
void SetTargets(std::vector< const TMVA::Event * > &evs, std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap)
least squares BDT, set the targets for a collection of events
Definition LossFunction.cxx:437

TMVA::LeastSquaresLossFunctionBDT::Target
Double_t Target(LossFunctionEventInfo &e)
least squares BDT, set the target for a single event
Definition LossFunction.cxx:459

TMVA::LeastSquaresLossFunctionBDT::Fit
Double_t Fit(std::vector< LossFunctionEventInfo > &evs)
huber BDT, determine the fit value for the terminal node based upon the events in the terminal node
Definition LossFunction.cxx:470

TMVA::LeastSquaresLossFunctionBDT::Init
void Init(std::map< const TMVA::Event *, LossFunctionEventInfo > &evinfomap, std::vector< double > &boostWeights)
least squares BDT, initialize the targets and prepare for the regression
Definition LossFunction.cxx:413

TMVA::LeastSquaresLossFunction::CalculateNetLoss
Double_t CalculateNetLoss(std::vector< LossFunctionEventInfo > &evs)
least squares , determine the net loss for a collection of events
Definition LossFunction.cxx:378

TMVA::LeastSquaresLossFunction::CalculateMeanLoss
Double_t CalculateMeanLoss(std::vector< LossFunctionEventInfo > &evs)
least squares , determine the mean loss for a collection of events
Definition LossFunction.cxx:390

TMVA::LeastSquaresLossFunction::CalculateLoss
Double_t CalculateLoss(LossFunctionEventInfo &e)
least squares , determine the loss for a single event
Definition LossFunction.cxx:368

TMVA::LossFunctionEventInfo
Definition LossFunction.h:48

double

unsigned int

TMath::Min
Short_t Min(Short_t a, Short_t b)
Returns the smallest of a and b.
Definition TMathBase.h:198

TMath::Abs
Short_t Abs(Short_t d)
Returns the absolute value of parameter Short_t d.
Definition TMathBase.h:123

Config.h