doc/master/rs__numberCountingCombination_8py_source.html

# \file

# \ingroup tutorial_roostats

# \notebook -js

# 'Number Counting Example' RooStats tutorial macro #100

#

# This tutorial shows an example of a combination of

# two searches using number counting with background uncertainty.

#

# The macro uses a RooStats "factory" to construct a PDF

# that represents the two number counting analyses with background

# uncertainties.  The uncertainties are taken into account by

# considering a sideband measurement of a size that corresponds to the

# background uncertainty.  The problem has been studied in these references:

#  - http://arxiv.org/abs/physics/0511028

#  - http://arxiv.org/abs/physics/0702156

#  - http://cdsweb.cern.ch/record/1099969?ln=en

#

# After using the factory to make the model, we use a RooStats

# ProfileLikelihoodCalculator for a Hypothesis test and a confidence interval.

# The calculator takes into account systematics by eliminating nuisance parameters

# with the profile likelihood.  This is equivalent to the method of MINOS.

#

#

# \macro_image

# \macro_output

# \macro_code

#

# \author Kyle Cranmer (C++ version), and P. P. (Python translation)


import numpy as np

import ROOT


# use this order for safety on library loading


# declare three variations on the same tutorial

# rs_numberCountingCombination_expected()

# rs_numberCountingCombination_observed()

# rs_numberCountingCombination_observedWithTau()


# -------------------------------

# main driver to choose one

def rs_numberCountingCombination(flag=1):
    """Run one of the three variations of the tutorial.

    flag selects the variation:
      1 -> rs_numberCountingCombination_expected()
      2 -> rs_numberCountingCombination_observed()
      3 -> rs_numberCountingCombination_observedWithTau()
    Any other value runs nothing.
    """
    # The branches are mutually exclusive, so a single chain is enough.
    if flag == 1:
        rs_numberCountingCombination_expected()
    elif flag == 2:
        rs_numberCountingCombination_observed()
    elif flag == 3:
        rs_numberCountingCombination_observedWithTau()


# -------------------------------

def rs_numberCountingCombination_expected():
    """Number counting combination with two channels, using expected data.

    Considers both the hypothesis test of the null (masterSignal = 0) and
    the equivalent 95% confidence interval on masterSignal.  The p-value,
    the significance and the interval limits are printed, and the
    likelihood-ratio plot is saved as "rs_numberCountingCombination.png".

    Side effects: the factory, the workspace and the signal array are also
    stored in the module globals gf, gwspace and gs (debugging aid).
    """
    global gf, gwspace, gs

    separator = "-------------------------------------------------"

    ##############
    # The Model building stage
    ##############

    # Step 1, define arrays with signal & bkg expectations and background uncertainties.
    # The numpy arrays are handed to the factory where it expects a double*.
    #   Alternatively you can use cppyy:
    #       cppyy.cppdef("double s[2];")
    #       s_c = cppyy.gbl.s
    s = np.array([20.0, 10.0])  # expected signal
    b = np.array([100.0, 100.0])  # expected background
    db = np.array([0.0100, 0.0100])  # fractional background uncertainty

    # Step 2, use a RooStats factory to build a PDF for a
    # number counting combination and add it to the workspace.
    # We need to give the signal expectation to relate the masterSignal
    # to the signal contribution in the individual channels.
    # The model neglects correlations in background uncertainty,
    # but they could be added without much change to the example.
    f = ROOT.RooStats.NumberCountingPdfFactory()
    wspace = ROOT.RooWorkspace()

    # debugging: keep module-level handles on the main objects
    gf = f
    gwspace = wspace
    gs = s

    f.AddModel(s, 2, wspace, "TopLevelPdf", "masterSignal")

    # Step 3, use a RooStats factory to add datasets to the workspace.
    # Step 3a. Add the expected data to the workspace
    f.AddExpData(s, b, db, 2, wspace, "ExpectedNumberCountingData")

    # see the end of this function for a printout of the workspace
    #  wspace.Print()  # uncomment to see structure of workspace

    ##############
    # The Hypothesis testing stage:
    ##############

    # Step 4, Define the null hypothesis for the calculator
    # Here you need to know the name of the variables corresponding to hypothesis.
    mu = wspace.var("masterSignal")
    poi = ROOT.RooArgSet(mu)
    nullParams = ROOT.RooArgSet("nullParams")
    nullParams.addClone(mu)
    # here we explicitly set the value of the parameters for the null
    nullParams.setRealValue("masterSignal", 0)

    # Step 5, Create a calculator for doing the hypothesis test.
    plc = ROOT.RooStats.ProfileLikelihoodCalculator(
        wspace["ExpectedNumberCountingData"], wspace["TopLevelPdf"], poi, 0.05, nullParams
    )

    # Step 6, Use the Calculator to get a HypoTestResult
    htr = plc.GetHypoTest()
    assert htr != 0
    print(separator)
    print("The p-value for the null is ", htr.NullPValue())
    print("Corresponding to a significance of ", htr.Significance())
    print(separator + "\n\n")

    # expected case should return:
    # -------------------------------------------------
    # The p-value for the null is 0.015294
    # Corresponding to a significance of 2.16239
    # -------------------------------------------------

    ##############
    # Confidence Interval Stage
    ##############

    # Step 8, Here we re-use the ProfileLikelihoodCalculator to return a confidence interval.
    # We need to specify what are our parameters of interest
    paramsOfInterest = nullParams  # they are the same as before in this case
    plc.SetParameters(paramsOfInterest)
    lrint = plc.GetInterval()
    lrint.SetConfidenceLevel(0.95)

    # Step 9, make a plot of the likelihood ratio and the interval obtained
    # find limits
    lower = lrint.LowerLimit(mu)
    upper = lrint.UpperLimit(mu)

    c1 = ROOT.TCanvas("myc1", "myc1")
    lrPlot = ROOT.RooStats.LikelihoodIntervalPlot(lrint)
    lrPlot.SetMaximum(3.0)
    lrPlot.Draw()
    c1.Update()
    c1.Draw()
    c1.SaveAs("rs_numberCountingCombination.png")

    # Step 10a. Get upper and lower limits
    print("signal = ", lower)
    print("signal = ", upper)

    # Step 10b, Ask if masterSignal=0 is in the interval.
    # Note, this is equivalent to the question of a 2-sigma hypothesis test:
    # "is the parameter point masterSignal=0 inside the 95% confidence interval?"
    # Since the significance of the Hypothesis test was > 2-sigma it should not be:
    # eg. we exclude masterSignal=0 at 95% confidence.
    #
    # Step 10c, We also ask about the parameter point masterSignal=2,
    # which is inside the interval.
    for value in (0.0, 2.0):
        paramsOfInterest.setRealValue("masterSignal", value)
        print(separator)
        print("Consider this parameter point:")
        paramsOfInterest.first().Print()
        if lrint.IsInInterval(paramsOfInterest):
            print("It IS in the interval.")
        else:
            print("It is NOT in the interval.")
        # The closing separator belongs to both outcomes, not only to the
        # "NOT in the interval" branch.
        print(separator + "\n\n")

    # Drop the local references in a fixed order before returning.
    del lrint
    del htr
    del wspace
    del poi
    del nullParams

    #
    # Here's an example of what is in the workspace
    #  wspace.Print();
    #
    # RooWorkspace(NumberCountingWS) Number Counting WS contents
    #
    # variables
    # ---------
    # (x_0,masterSignal,expected_s_0,b_0,y_0,tau_0,x_1,expected_s_1,b_1,y_1,tau_1)
    #
    # p.d.f.s
    # -------
    # RooProdPdf.joint[ pdfs=(sigRegion_0,sideband_0,sigRegion_1,sideband_1) ] = 2.20148e-08
    # RooPoisson.sigRegion_0[ x=x_0 mean=splusb_0 ] = 0.036393
    # RooPoisson.sideband_0[ x=y_0 mean=bTau_0 ] = 0.00398939
    # RooPoisson.sigRegion_1[ x=x_1 mean=splusb_1 ] = 0.0380088
    # RooPoisson.sideband_1[ x=y_1 mean=bTau_1 ] = 0.00398939
    #
    # functions
    # --------
    # RooAddition.splusb_0[ set1=(s_0,b_0) set2=() ] = 120
    # RooProduct.s_0[ compRSet=(masterSignal,expected_s_0) compCSet=() ] = 20
    # RooProduct.bTau_0[ compRSet=(b_0,tau_0) compCSet=() ] = 10000
    # RooAddition.splusb_1[ set1=(s_1,b_1) set2=() ] = 110
    # RooProduct.s_1[ compRSet=(masterSignal,expected_s_1) compCSet=() ] = 10
    # RooProduct.bTau_1[ compRSet=(b_1,tau_1) compCSet=() ] = 10000
    #
    # datasets
    # --------
    # RooDataSet.ExpectedNumberCountingData(x_0,y_0,x_1,y_1)
    #
    # embedded pre-calculated expensive components
    # -------------------------------------------


def rs_numberCountingCombination_observed():
    """Number counting combination with two channels, using observed data.

    The same example with observed data in a main measurement and a
    background-only auxiliary measurement with a factor tau more background
    than in the main measurement.  Here the auxiliary measurement is given
    as an observed background and its fractional uncertainty.

    Prints the p-value and significance of the null (masterSignal = 0) and
    the limits of the 95% confidence interval on masterSignal.
    """
    separator = "-------------------------------------------------"

    ##############
    # The Model building stage
    ##############

    # Step 1, define arrays with signal & bkg expectations and background uncertainties
    # We still need the expectation to relate signal in different channels with the master signal.
    # numpy arrays are used where the factory expects a double*, as in the
    # expected-data variation of this tutorial.
    s = np.array([20.0, 10.0])  # expected signal

    # Step 2, use a RooStats factory to build a PDF for a
    # number counting combination and add it to the workspace.
    # We need to give the signal expectation to relate the masterSignal
    # to the signal contribution in the individual channels.
    # The model neglects correlations in background uncertainty,
    # but they could be added without much change to the example.
    f = ROOT.RooStats.NumberCountingPdfFactory()
    wspace = ROOT.RooWorkspace()
    f.AddModel(s, 2, wspace, "TopLevelPdf", "masterSignal")

    # Step 3, use a RooStats factory to add datasets to the workspace.
    # Add the observed data to the workspace
    mainMeas = np.array([123.0, 117.0])  # observed main measurement
    bkgMeas = np.array([111.23, 98.76])  # observed background
    dbMeas = np.array([0.011, 0.0095])  # observed fractional background uncertainty
    f.AddData(mainMeas, bkgMeas, dbMeas, 2, wspace, "ObservedNumberCountingData")

    #  wspace.Print()  # uncomment to see structure of workspace

    ##############
    # The Hypothesis testing stage:
    ##############

    # Step 4, Define the null hypothesis for the calculator
    # Here you need to know the name of the variables corresponding to hypothesis.
    mu = wspace.var("masterSignal")
    poi = ROOT.RooArgSet(mu)
    nullParams = ROOT.RooArgSet("nullParams")
    nullParams.addClone(mu)
    # here we explicitly set the value of the parameters for the null
    nullParams.setRealValue("masterSignal", 0)

    # Step 5, Create a calculator for doing the hypothesis test.
    plc = ROOT.RooStats.ProfileLikelihoodCalculator(
        wspace.data("ObservedNumberCountingData"), wspace.pdf("TopLevelPdf"), poi, 0.05, nullParams
    )

    # Show the tau variables of both channels as they stand in the workspace.
    wspace.var("tau_0").Print()
    wspace.var("tau_1").Print()

    # Step 6, Use the Calculator to get a HypoTestResult
    htr = plc.GetHypoTest()
    print(separator)
    print("The p-value for the null is ", htr.NullPValue())
    print("Corresponding to a significance of ", htr.Significance())
    print(separator + "\n\n")

    # observed case should return:
    # -------------------------------------------------
    # The p-value for the null is 0.0351669
    # Corresponding to a significance of 1.80975
    # -------------------------------------------------

    ##############
    # Confidence Interval Stage
    ##############

    # Step 8, Here we re-use the ProfileLikelihoodCalculator to return a confidence interval.
    # We need to specify what are our parameters of interest
    paramsOfInterest = nullParams  # they are the same as before in this case
    plc.SetParameters(paramsOfInterest)
    lrint = plc.GetInterval()
    lrint.SetConfidenceLevel(0.95)

    # Step 9c. Get upper and lower limits
    print("signal = ", lrint.LowerLimit(mu))
    print("signal = ", lrint.UpperLimit(mu))

    # Drop the local references in a fixed order before returning.
    del lrint
    del htr
    del wspace
    del nullParams
    del poi


def rs_numberCountingCombination_observedWithTau():
    """Number counting combination with observed data in the on-off problem.

    The same example with observed data in a main measurement and a
    background-only auxiliary measurement with a factor tau more background
    than in the main measurement.  Here the auxiliary measurement is given
    as an observed sideband count together with tau.

    Prints the p-value and significance of the null (masterSignal = 0) and
    the limits of the 95% confidence interval on masterSignal.
    """
    separator = "-------------------------------------------------"

    ##############
    # The Model building stage
    ##############

    # Step 1, define arrays with signal & bkg expectations and background uncertainties
    # We still need the expectation to relate signal in different channels with the master signal.
    # numpy arrays are used where the factory expects a double*, as in the
    # expected-data variation of this tutorial.
    s = np.array([20.0, 10.0])  # expected signal

    # Step 2, use a RooStats factory to build a PDF for a
    # number counting combination and add it to the workspace.
    # We need to give the signal expectation to relate the masterSignal
    # to the signal contribution in the individual channels.
    # The model neglects correlations in background uncertainty,
    # but they could be added without much change to the example.
    f = ROOT.RooStats.NumberCountingPdfFactory()
    wspace = ROOT.RooWorkspace()
    f.AddModel(s, 2, wspace, "TopLevelPdf", "masterSignal")

    # Step 3, use a RooStats factory to add datasets to the workspace.
    # Add the observed data to the workspace in the on-off problem.
    mainMeas = np.array([123.0, 117.0])  # observed main measurement
    sideband = np.array([11123.0, 9876.0])  # observed sideband
    # ratio of bkg in sideband to bkg in main measurement, from experimental design.
    tau = np.array([100.0, 100.0])
    f.AddDataWithSideband(mainMeas, sideband, tau, 2, wspace, "ObservedNumberCountingDataWithSideband")

    #  wspace.Print()  # uncomment to see structure of workspace

    ##############
    # The Hypothesis testing stage:
    ##############

    # Step 4, Define the null hypothesis for the calculator
    # Here you need to know the name of the variables corresponding to hypothesis.
    mu = wspace.var("masterSignal")
    poi = ROOT.RooArgSet(mu)
    nullParams = ROOT.RooArgSet("nullParams")
    nullParams.addClone(mu)
    # here we explicitly set the value of the parameters for the null
    nullParams.setRealValue("masterSignal", 0)

    # Step 5, Create a calculator for doing the hypothesis test.
    plc = ROOT.RooStats.ProfileLikelihoodCalculator(
        wspace.data("ObservedNumberCountingDataWithSideband"), wspace.pdf("TopLevelPdf"), poi, 0.05, nullParams
    )

    # Step 6, Use the Calculator to get a HypoTestResult
    htr = plc.GetHypoTest()
    print(separator)
    print("The p-value for the null is ", htr.NullPValue())
    print("Corresponding to a significance of ", htr.Significance())
    print(separator + "\n\n")

    # observed case should return:
    # -------------------------------------------------
    # The p-value for the null is 0.0352035
    # Corresponding to a significance of 1.80928
    # -------------------------------------------------

    ##############
    # Confidence Interval Stage
    ##############

    # Step 8, Here we re-use the ProfileLikelihoodCalculator to return a confidence interval.
    # We need to specify what are our parameters of interest
    paramsOfInterest = nullParams  # they are the same as before in this case
    plc.SetParameters(paramsOfInterest)
    lrint = plc.GetInterval()
    lrint.SetConfidenceLevel(0.95)

    # Step 9c. Get upper and lower limits
    print("signal = ", lrint.LowerLimit(mu))
    print("signal = ", lrint.UpperLimit(mu))

    # Drop the local references in a fixed order before returning.
    del lrint
    del htr
    del wspace
    del nullParams
    del poi


# Module-level entry point: run the expected-data variation (flag=1).
rs_numberCountingCombination(flag=1)

len
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h Atom_t Int_t ULong_t ULong_t unsigned char prop_list Atom_t Atom_t Atom_t Time_t UChar_t len
Definition TGWin32VirtualXProxy.cxx:249

Print
void Print(GNN_Data &d, std::string txt="")
Definition TMVA_SOFIE_GNN_Application.C:59

RooArgSet
RooArgSet is a container object that can hold multiple RooAbsArg objects.
Definition RooArgSet.h:24

RooWorkspace
Persistable container for RooFit projects.
Definition RooWorkspace.h:43

rs_numberCountingCombination
Definition rs_numberCountingCombination.py:1