doc/master/HypoTestResult_8cxx_source.html

// @(#)root/roostats:$Id$

// Author: Kyle Cranmer, Lorenzo Moneta, Gregory Schott, Wouter Verkerke, Sven Kreiss

/*************************************************************************

 * Copyright (C) 1995-2008, Rene Brun and Fons Rademakers.               *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


/*****************************************************************************

 * Project: RooStats

 * Package: RooFit/RooStats

 * @(#)root/roofit/roostats:$Id$

 * Authors:

 *   Kyle Cranmer, Lorenzo Moneta, Gregory Schott, Wouter Verkerke, Sven Kreiss

 *

 *****************************************************************************/


/** \class RooStats::HypoTestResult

    \ingroup Roostats


HypoTestResult is a base class for results from hypothesis tests.

Any tool inheriting from HypoTestCalculator can return a HypoTestResult.

As such, it stores a p-value for the null-hypothesis (e.g. background-only)

and an alternate hypothesis (e.g. signal+background).

The p-values can also be transformed into confidence levels

(\f$CL_{b}\f$, \f$CL_{s+b}\f$) in a trivial way.

The ratio of the \f$CL_{s+b}\f$ to \f$CL_{b}\f$ is often called

\f$CL_{s}\f$, and is considered useful, though it is not a probability.

Finally, the p-value of the null can be transformed into a number of

equivalent Gaussian sigma using the Significance method.


The p-value of the null for a given test statistic is rigorously defined and

this is the starting point for the following conventions.


### Conventions used in this class


The p-value for the null and alternate are on the **same side** of the

observed value of the test statistic. This is the more standard

convention and avoids confusion when doing inverted tests.


For exclusion, we also want the formula \f$CL_{s} = CL_{s+b} / CL_{b}\f$

to hold which therefore defines our conventions for \f$CL_{s+b}\f$ and

\f$CL_{b}\f$. \f$CL_{s}\f$ was specifically invented for exclusion

and therefore all quantities need to be related through the assignments

as they are for exclusion: \f$CL_{s+b} = p_{s+b}\f$; \f$CL_{b} = p_{b}\f$. This

is derived by considering the scenarios of a powerful and not powerful

inverted test, where for the not so powerful test, \f$CL_{s}\f$ must be

close to one.


For results of Hypothesis tests,

\f$CL_{s}\f$ has no similar direct interpretation as for exclusion and can

be larger than one.


*/


#include "RooStats/HypoTestResult.h"

#include "RooStats/SamplingDistribution.h"

#include "RooAbsReal.h"


#include "RooStats/RooStatsUtils.h"


#include <TMath.h>


#include <limits>

// Marker value for quantities that have not been set yet (see its use in the
// constructors below). Expands to a float quiet NaN; the unqualified
// numeric_limits relies on the using-declaration further down being visible
// wherever the macro is expanded.
#define NaN numeric_limits<float>::quiet_NaN()

// Shorthand for TMath::IsNaN, used in this file to test for the marker above.
#define IsNaN(a) TMath::IsNaN(a)


// Lets the definitions below name RooStats types without qualification.
using namespace RooStats;

// Makes numeric_limits (needed by the NaN macro) and endl available unqualified.
using std::numeric_limits, std::endl;


////////////////////////////////////////////////////////////////////////////////

/// Default constructor.
///
/// Builds a result whose name and title are both `name`, with the null and
/// alternate p-values set to NaN. All remaining state is set up by the
/// (name, nullp, altp) constructor this one delegates to: zero p-value
/// errors, NaN observed test statistic, no distributions or detailed outputs,
/// right-tail p-values, background not treated as the alternate hypothesis.

HypoTestResult::HypoTestResult(const char* name) :
   HypoTestResult(name, NaN, NaN)
{
}


////////////////////////////////////////////////////////////////////////////////

/// Alternate constructor.
///
/// Builds a result whose name and title are both `name` and whose p-values
/// are given directly.
///
/// \param name   used for both the TNamed name and title
/// \param nullp  p-value of the null hypothesis
/// \param altp   p-value of the alternate hypothesis
///
/// The p-value errors start at zero, the observed test statistic at NaN, no
/// distributions or detailed outputs are attached, p-values are taken from
/// the right tail and the background is not treated as the alternate.

HypoTestResult::HypoTestResult(const char* name, double nullp, double altp)
   : TNamed(name, name),
     fNullPValue(nullp),
     fAlternatePValue(altp),
     fNullPValueError(0),
     fAlternatePValueError(0),
     fTestStatisticData(NaN),
     fAllTestStatisticsData(nullptr),
     fNullDistr(nullptr),
     fAltDistr(nullptr),
     fNullDetailedOutput(nullptr),
     fAltDetailedOutput(nullptr),
     fPValueIsRightTail(true),
     fBackgroundIsAlt(false)
{
}


////////////////////////////////////////////////////////////////////////////////

/// Copy constructor.
///
/// The scalar state (both p-values, their errors, the observed test statistic
/// and the two convention flags) is taken over from `other` directly. The
/// owned distributions and detailed outputs start out empty and are filled by
/// Append(), which copy-constructs whatever `other` holds and then refreshes
/// the p-values where possible. fAllTestStatisticsData is left unset.

HypoTestResult::HypoTestResult(const HypoTestResult& other)
   : TNamed(other),
     fNullPValue(other.fNullPValue),
     fAlternatePValue(other.fAlternatePValue),
     fNullPValueError(other.fNullPValueError),
     fAlternatePValueError(other.fAlternatePValueError),
     fTestStatisticData(other.fTestStatisticData),
     fAllTestStatisticsData(nullptr),
     fNullDistr(nullptr),
     fAltDistr(nullptr),
     fNullDetailedOutput(nullptr),
     fAltDetailedOutput(nullptr),
     fPValueIsRightTail(other.GetPValueIsRightTail()),
     fBackgroundIsAlt(other.GetBackGroundIsAlt())
{
   // Everything is empty at this point, so appending amounts to a deep copy.
   Append(&other);
}


////////////////////////////////////////////////////////////////////////////////

/// Destructor. Nothing to release by hand: the destructor body is empty and
/// member clean-up is left to the members' own destructors.

HypoTestResult::~HypoTestResult() = default;


////////////////////////////////////////////////////////////////////////////////

/// Assignment operator.
///
/// Self-assignment is a no-op. Otherwise the name, title and scalar state of
/// `other` are copied, everything this object currently owns is released, and
/// Append() then copies the distributions, detailed outputs and fit info of
/// `other` and refreshes the p-values where possible.
/// fAllTestStatisticsData is cleared and not copied.

HypoTestResult & HypoTestResult::operator=(const HypoTestResult& other) {
   if (this != &other) {
      SetName(other.GetName());
      SetTitle(other.GetTitle());

      fNullPValue = other.fNullPValue;
      fAlternatePValue = other.fAlternatePValue;
      fNullPValueError = other.fNullPValueError;
      fAlternatePValueError = other.fAlternatePValueError;
      // Must be in place before Append(), which only adopts the other
      // object's value when ours is still NaN.
      fTestStatisticData = other.fTestStatisticData;

      // Release the current contents so that Append() starts from scratch.
      fAllTestStatisticsData.reset();
      fNullDistr.reset();
      fAltDistr.reset();
      fNullDetailedOutput.reset();
      fAltDetailedOutput.reset();
      fFitInfo.reset();

      fPValueIsRightTail = other.GetPValueIsRightTail();
      fBackgroundIsAlt = other.GetBackGroundIsAlt();

      Append(&other);
   }

   return *this;
}


////////////////////////////////////////////////////////////////////////////////

/// Add additional toy-MC experiments to the current results.

/// Use the data test statistics of the added object if it is not already

/// set (otherwise, ignore the new one).


void HypoTestResult::Append(const HypoTestResult* other) {

   if (fNullDistr) {

      fNullDistr->Add(other->GetNullDistribution());

   } else if (other->GetNullDistribution()) {

      fNullDistr = std::make_unique<SamplingDistribution>(*other->GetNullDistribution());

   }


   if (fAltDistr) {

      fAltDistr->Add(other->GetAltDistribution());

   } else if (other->GetAltDistribution()) {

      fAltDistr = std::make_unique<SamplingDistribution>(*other->GetAltDistribution());

   }


   if( fNullDetailedOutput ) {

      if( other->GetNullDetailedOutput() ) fNullDetailedOutput->append( *other->GetNullDetailedOutput() );

   }else{

      if( other->GetNullDetailedOutput() ) fNullDetailedOutput = std::make_unique<RooDataSet>( *other->GetNullDetailedOutput() );

   }


   if( fAltDetailedOutput ) {

      if( other->GetAltDetailedOutput() ) fAltDetailedOutput->append( *other->GetAltDetailedOutput() );

   }else{

      if( other->GetAltDetailedOutput() ) fAltDetailedOutput = std::make_unique<RooDataSet>( *other->GetAltDetailedOutput() );

   }


   if( fFitInfo ) {

      if( other->GetFitInfo() ) fFitInfo->append( *other->GetFitInfo() );

   }else{

      if( other->GetFitInfo() ) fFitInfo = std::make_unique<RooDataSet>( *other->GetFitInfo());

   }


   // if no data is present use the other HypoTestResult's data

   if(IsNaN(fTestStatisticData)) fTestStatisticData = other->GetTestStatisticData();


   UpdatePValue(fNullDistr.get(), fNullPValue, fNullPValueError, true);

   UpdatePValue(fAltDistr.get(), fAlternatePValue, fAlternatePValueError, false);

}


////////////////////////////////////////////////////////////////////////////////


/// Take ownership of `alt` as the sampling distribution of the alternate
/// hypothesis, destroying any distribution held before, and recompute the
/// alternate p-value and its error if that is possible (see UpdatePValue()).

void HypoTestResult::SetAltDistribution(SamplingDistribution *alt) {
   fAltDistr = std::unique_ptr<SamplingDistribution>(alt);

   UpdatePValue(fAltDistr.get(), fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


/// Take ownership of `null` as the sampling distribution of the null
/// hypothesis, destroying any distribution held before, and recompute the
/// null p-value and its error if that is possible (see UpdatePValue()).

void HypoTestResult::SetNullDistribution(SamplingDistribution *null) {
   fNullDistr = std::unique_ptr<SamplingDistribution>(null);

   UpdatePValue(fNullDistr.get(), fNullPValue, fNullPValueError, true);
}


////////////////////////////////////////////////////////////////////////////////


/// Store `tsd` as the value of the test statistic evaluated on data and
/// recompute both p-values (and their errors) against it, for whichever of
/// the null and alternate distributions are present.

void HypoTestResult::SetTestStatisticData(const double tsd) {
   fTestStatisticData = tsd;

   // Both tails depend on the observed value, so both must be refreshed.
   UpdatePValue(fNullDistr.get(), fNullPValue, fNullPValueError, true);
   UpdatePValue(fAltDistr.get(), fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


void HypoTestResult::SetAllTestStatisticsData(const RooArgList* tsd) {

   if (tsd) fAllTestStatisticsData.reset(static_cast<const RooArgList*>(tsd->snapshot()));


   if( fAllTestStatisticsData  &&  !fAllTestStatisticsData->empty() ) {

      RooRealVar* firstTS = static_cast<RooRealVar*>(fAllTestStatisticsData->at(0));

      if( firstTS ) SetTestStatisticData( firstTS->getVal() );

   }

}


////////////////////////////////////////////////////////////////////////////////


/// Choose the tail used for the p-values: `true` integrates from the observed
/// test statistic upwards, `false` from below up to it (see UpdatePValue()).
/// Both p-values and their errors are recomputed with the new setting where
/// possible.

void HypoTestResult::SetPValueIsRightTail(bool pr) {
   fPValueIsRightTail = pr;

   // The integration range has changed for both hypotheses.
   UpdatePValue(fNullDistr.get(), fNullPValue, fNullPValueError, true);
   UpdatePValue(fAltDistr.get(), fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


/// Whether a value of the test statistic on data has been stored, i.e.
/// whether fTestStatisticData is anything other than NaN.

bool HypoTestResult::HasTestStatisticData() const {
   const bool unset = IsNaN(fTestStatisticData);
   return !unset;
}


////////////////////////////////////////////////////////////////////////////////


/// Error on the null p-value. This is the stored value; nothing is
/// recomputed here.

double HypoTestResult::NullPValueError() const {
   return fNullPValueError;
}


////////////////////////////////////////////////////////////////////////////////

/// Error on \f$CL_{b}\f$.
///
/// Returns the stored error of the alternate p-value when the background is
/// the alternate hypothesis (fBackgroundIsAlt), and the stored error of the
/// null p-value otherwise. This is the mirror image of CLsplusbError().

double HypoTestResult::CLbError() const {
   if (fBackgroundIsAlt) {
      return fAlternatePValueError;
   }
   return fNullPValueError;
}


////////////////////////////////////////////////////////////////////////////////


/// Error on \f$CL_{s+b}\f$.
///
/// Returns the stored error of the null p-value when the background is the
/// alternate hypothesis (fBackgroundIsAlt), and the stored error of the
/// alternate p-value otherwise. This is the mirror image of CLbError().

double HypoTestResult::CLsplusbError() const {
   if (fBackgroundIsAlt) {
      return fNullPValueError;
   }
   return fAlternatePValueError;
}


////////////////////////////////////////////////////////////////////////////////

/// Taylor expansion series approximation for standard deviation (error propagation)


double HypoTestResult::SignificanceError() const {

   return NullPValueError() / ROOT::Math::normal_pdf(Significance());

}


////////////////////////////////////////////////////////////////////////////////

/// Returns an estimate of the error on \f$CL_{s}\f$ through combination of the
/// errors on \f$CL_{b}\f$ and \f$CL_{s+b}\f$:
/// \f[
/// \sigma_{CL_s} = CL_s
/// \sqrt{\left( \frac{\sigma_{CL_{s+b}}}{CL_{s+b}} \right)^2 + \left( \frac{\sigma_{CL_{b}}}{CL_{b}} \right)^2}
/// \f]
///
/// It is evaluated in the algebraically equivalent form
/// \f$\sqrt{\sigma_{CL_{s+b}}^2 + \sigma_{CL_{b}}^2 \, CL_s^2} \,/\, CL_b\f$.
///
/// Special cases: 0 is returned unless both sampling distributions are
/// present, and -1 is returned when \f$CL_{b}\f$ is exactly zero.

double HypoTestResult::CLsError() const {
   // Without both toy distributions there is no error to propagate.
   if (!(fAltDistr && fNullDistr)) return 0.0;

   // A vanishing CL_b would make the division below ill-defined; flag it.
   if (CLb() == 0) return -1;

   const double clbVariance = std::pow(CLbError(), 2);
   const double clsbVariance = std::pow(CLsplusbError(), 2);
   const double clsSquared = std::pow(CLs(), 2);

   return std::sqrt(clsbVariance + clbVariance * clsSquared) / CLb();
}


////////////////////////////////////////////////////////////////////////////////

/// Updates the p-value if sufficient data is available.
///
/// \param distr   sampling distribution to integrate; nothing happens if null
/// \param pvalue  receives the integral of `distr` over the selected tail
/// \param perror  receives the error reported for that integral
///
/// The fourth (bool) parameter is not used by this implementation. Nothing
/// happens either while the test statistic on data is still NaN.
///
/// The tail is chosen by fPValueIsRightTail: [fTestStatisticData, +inf] for
/// the right tail, [-inf, fTestStatisticData] otherwise. Care is needed for
/// discrete distributions: to get the right behaviour for limits the interval
/// is always closed, so the observed value itself is included both for the
/// Alt and the Null case.

void HypoTestResult::UpdatePValue(const SamplingDistribution* distr, double &pvalue, double &perror, bool /*isNull*/) {
   if (IsNaN(fTestStatisticData) || !distr) return;

   const double lowerEdge = fPValueIsRightTail ? fTestStatisticData : -RooNumber::infinity();
   const double upperEdge = fPValueIsRightTail ? RooNumber::infinity() : fTestStatisticData;

   // normalised integral over an interval closed at both ends
   pvalue = distr->IntegralAndError(perror, lowerEdge, upperEdge, true, true, true);
}


////////////////////////////////////////////////////////////////////////////////

/// Print out some information about the results to std::cout.
///
/// Note: the Alt/Null labels are used for the hypotheses here, as the Null
/// might be the s+b hypothesis.
///
/// The "+/-" errors are only printed when at least one sampling distribution
/// is present; the toy counts and the test statistic on data are only printed
/// when available. The option argument is ignored.

void HypoTestResult::Print(Option_t * ) const
{
   const bool fromToys = fAltDistr || fNullDistr;
   std::ostream &out = std::cout;

   out << std::endl << "Results " << GetName() << ": " << std::endl;

   out << " - Null p-value = " << NullPValue();
   if (fromToys) {
      out << " +/- " << NullPValueError();
   }
   out << std::endl;

   out << " - Significance = " << Significance();
   if (fromToys) {
      out << " +/- " << SignificanceError() << " sigma";
   }
   out << std::endl;

   if (fAltDistr) {
      out << " - Number of Alt toys: " << fAltDistr->GetSize() << std::endl;
   }
   if (fNullDistr) {
      out << " - Number of Null toys: " << fNullDistr->GetSize() << std::endl;
   }

   if (HasTestStatisticData()) {
      out << " - Test statistic evaluated on data: " << fTestStatisticData << std::endl;
   }

   out << " - CL_b: " << CLb();
   if (fromToys) {
      out << " +/- " << CLbError();
   }
   out << std::endl;

   out << " - CL_s+b: " << CLsplusb();
   if (fromToys) {
      out << " +/- " << CLsplusbError();
   }
   out << std::endl;

   out << " - CL_s: " << CLs();
   if (fromToys) {
      out << " +/- " << CLsError();
   }
   out << std::endl;
}


NaN
#define NaN
Definition HypoTestResult.cxx:68

IsNaN
#define IsNaN(a)
Definition HypoTestResult.cxx:69

HypoTestResult.h

RooAbsReal.h

NaN
#define NaN
Definition RooLagrangianMorphFunc.cxx:86

RooStatsUtils.h

Option_t
const char Option_t
Definition RtypesCore.h:66

SamplingDistribution.h

TRangeDynCast
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
Definition TCollection.h:358

name
char name[80]
Definition TGX11.cxx:110

TMath.h

ROOT::Detail::TRangeCast
Definition TCollection.h:311

RooArgList
RooArgList is a container object that can hold multiple RooAbsArg objects.
Definition RooArgList.h:22

RooNumber::infinity
static constexpr double infinity()
Return internal infinity representation.
Definition RooNumber.h:25

RooRealVar
Variable that can be changed from the outside.
Definition RooRealVar.h:37

RooStats::HypoTestResult
HypoTestResult is a base class for results from hypothesis tests.
Definition HypoTestResult.h:22

RooStats::HypoTestResult::fNullDetailedOutput
std::unique_ptr< RooDataSet > fNullDetailedOutput
Definition HypoTestResult.h:136

RooStats::HypoTestResult::UpdatePValue
void UpdatePValue(const SamplingDistribution *distr, double &pvalue, double &perror, bool pIsRightTail)
updates the pvalue if sufficient data is available
Definition HypoTestResult.cxx:309

RooStats::HypoTestResult::Print
void Print(const Option_t *="") const override
Print out some information about the results Note: use Alt/Null labels for the hypotheses here as the...
Definition HypoTestResult.cxx:332

RooStats::HypoTestResult::fPValueIsRightTail
bool fPValueIsRightTail
Definition HypoTestResult.h:139

RooStats::HypoTestResult::fNullPValue
double fNullPValue
p-value for the null hypothesis (small number means disfavoured)
Definition HypoTestResult.h:128

RooStats::HypoTestResult::HasTestStatisticData
bool HasTestStatisticData(void) const
Definition HypoTestResult.cxx:250

RooStats::HypoTestResult::fAlternatePValueError
double fAlternatePValueError
error of p-value for the alternate hypothesis (small number means disfavoured)
Definition HypoTestResult.h:131

RooStats::HypoTestResult::operator=
HypoTestResult & operator=(const HypoTestResult &other)
assignment operator
Definition HypoTestResult.cxx:135

RooStats::HypoTestResult::CLsplusb
virtual double CLsplusb() const
Convert AlternatePValue into a "confidence level".
Definition HypoTestResult.h:61

RooStats::HypoTestResult::fAltDetailedOutput
std::unique_ptr< RooDataSet > fAltDetailedOutput
Definition HypoTestResult.h:137

RooStats::HypoTestResult::SetAllTestStatisticsData
void SetAllTestStatisticsData(const RooArgList *tsd)
Definition HypoTestResult.cxx:230

RooStats::HypoTestResult::Append
virtual void Append(const HypoTestResult *other)
add values from another HypoTestResult
Definition HypoTestResult.cxx:167

RooStats::HypoTestResult::NullPValueError
double NullPValueError() const
The error on the Null p-value.
Definition HypoTestResult.cxx:256

RooStats::HypoTestResult::CLsError
double CLsError() const
The error on the ratio \f$CL_{s+b} / CL_{b}\f$.
Definition HypoTestResult.cxx:291

RooStats::HypoTestResult::Significance
virtual double Significance() const
familiar name for the Null p-value in terms of 1-sided Gaussian significance
Definition HypoTestResult.h:75

RooStats::HypoTestResult::fBackgroundIsAlt
bool fBackgroundIsAlt
Definition HypoTestResult.h:140

RooStats::HypoTestResult::SetNullDistribution
void SetNullDistribution(SamplingDistribution *null)
Definition HypoTestResult.cxx:214

RooStats::HypoTestResult::~HypoTestResult
~HypoTestResult() override
destructor
Definition HypoTestResult.cxx:127

RooStats::HypoTestResult::HypoTestResult
HypoTestResult(const char *name=nullptr)
default constructor
Definition HypoTestResult.cxx:78

RooStats::HypoTestResult::SignificanceError
double SignificanceError() const
The error on the significance, computed from NullPValueError via error propagation.
Definition HypoTestResult.cxx:279

RooStats::HypoTestResult::NullPValue
virtual double NullPValue() const
Return p-value for null hypothesis.
Definition HypoTestResult.h:52

RooStats::HypoTestResult::CLbError
double CLbError() const
The error on the "confidence level" of the null hypothesis.
Definition HypoTestResult.cxx:266

RooStats::HypoTestResult::SetTestStatisticData
void SetTestStatisticData(const double tsd)
Definition HypoTestResult.cxx:221

RooStats::HypoTestResult::CLsplusbError
double CLsplusbError() const
The error on the "confidence level" of the alternative hypothesis.
Definition HypoTestResult.cxx:272

RooStats::HypoTestResult::fNullPValueError
double fNullPValueError
error of p-value for the null hypothesis (small number means disfavoured)
Definition HypoTestResult.h:130

RooStats::HypoTestResult::fTestStatisticData
double fTestStatisticData
result of the test statistic evaluated on data
Definition HypoTestResult.h:132

RooStats::HypoTestResult::SetAltDistribution
void SetAltDistribution(SamplingDistribution *alt)
Definition HypoTestResult.cxx:207

RooStats::HypoTestResult::SetPValueIsRightTail
void SetPValueIsRightTail(bool pr)
Definition HypoTestResult.cxx:241

RooStats::HypoTestResult::fAllTestStatisticsData
std::unique_ptr< const RooArgList > fAllTestStatisticsData
for the case of multiple test statistics, holds all the results
Definition HypoTestResult.h:133

RooStats::HypoTestResult::fFitInfo
std::unique_ptr< RooDataSet > fFitInfo
Definition HypoTestResult.h:138

RooStats::HypoTestResult::fAltDistr
std::unique_ptr< SamplingDistribution > fAltDistr
Definition HypoTestResult.h:135

RooStats::HypoTestResult::CLs
virtual double CLs() const
\f$CL_{s}\f$ is simply \f$CL_{s+b} / CL_{b}\f$ (not a method, but a quantity)
Definition HypoTestResult.h:64

RooStats::HypoTestResult::fAlternatePValue
double fAlternatePValue
p-value for the alternate hypothesis (small number means disfavoured)
Definition HypoTestResult.h:129

RooStats::HypoTestResult::fNullDistr
std::unique_ptr< SamplingDistribution > fNullDistr
Definition HypoTestResult.h:134

RooStats::HypoTestResult::CLb
virtual double CLb() const
Convert NullPValue into a "confidence level".
Definition HypoTestResult.h:58

RooStats::SamplingDistribution
This class simply holds a sampling distribution of some test statistic.
Definition SamplingDistribution.h:28

TNamed
The TNamed class is the base class for all named ROOT classes.
Definition TNamed.h:29

TNamed::SetTitle
virtual void SetTitle(const char *title="")
Set the title of the TNamed.
Definition TNamed.cxx:164

TNamed::GetName
const char * GetName() const override
Returns name of object.
Definition TNamed.h:47

TNamed::SetName
virtual void SetName(const char *name)
Set the name of the TNamed.
Definition TNamed.cxx:140

ROOT::Math::normal_pdf
double normal_pdf(double x, double sigma=1, double x0=0)
Probability density function of the normal (Gaussian) distribution with mean x0 and standard deviatio...
Definition PdfFuncMathCore.h:509

RooStats
Namespace for the RooStats classes.
Definition CodegenImpl.h:58