doc/v622/RooJohnson_8cxx_source.html

// Author: Stephan Hageboeck, CERN, May 2019

/*****************************************************************************

 * Project: RooFit                                                           *

 * Authors:                                                                  *

 *   WV, Wouter Verkerke, UC Santa Barbara, verkerke@slac.stanford.edu       *

 *   DK, David Kirkby,    UC Irvine,         dkirkby@uci.edu                 *

 *                                                                           *

 * Copyright (c) 2000-2019, Regents of the University of California          *

 *                          and Stanford University. All rights reserved.    *

 *                                                                           *

 * Redistribution and use in source and binary forms,                        *

 * with or without modification, are permitted according to the terms        *

 * listed in LICENSE (http://roofit.sourceforge.net/license.txt)             *

 *****************************************************************************/


/** \class RooJohnson

    \ingroup Roofit


Johnson's \f$ S_{U} \f$ distribution.


This PDF results from transforming the variable \f$ x \f$ such that the transformed variable \f$ z \f$ follows a standard normal distribution:

\f[

  z = \gamma + \delta \sinh^{-1}\left( \frac{x - \mu}{\lambda} \right)

\f]

The resulting PDF is

\f[

  \mathrm{PDF}[\mathrm{Johnson}\ S_U] = \frac{\delta}{\lambda\sqrt{2\pi}}

  \frac{1}{\sqrt{1 + \left( \frac{x-\mu}{\lambda} \right)^2}}

  \;\exp\left[-\frac{1}{2} \left(\gamma + \delta \sinh^{-1}\left(\frac{x-\mu}{\lambda}\right) \right)^2\right].

\f]


It is often used to fit a mass difference for charm decays, and therefore the variable \f$ x \f$ is called

"mass" in the implementation. A mass threshold allows setting the PDF to zero to the left of the threshold.


###References:

Johnson, N. L. (1949). *Systems of Frequency Curves Generated by Methods of Translation*. Biometrika **36(1/2)**, 149–176. [doi:10.2307/2332539](https://doi.org/10.2307%2F2332539)


\image html RooJohnson_plot.png


**/


#include "RooJohnson.h"


#include "RooRandom.h"

#include "RooHelpers.h"

#include "BatchHelpers.h"

#include "RooVDTHeaders.h"


#include <cmath>

#include "TMath.h"


using namespace BatchHelpers;


ClassImp(RooJohnson);


////////////////////////////////////////////////////////////////////////////////

/// Construct a new Johnson PDF.

///

/// \param name Name that identifies the PDF in computations

/// \param title Title for plotting

/// \param mass The variable of the PDF. Often this is a mass.

/// \param mu Location parameter of the Gaussian component.

/// \param lambda Width parameter (>0) of the Gaussian component.

/// \param gamma Shape parameter that distorts distribution to left/right.

/// \param delta Shape parameter (>0) that determines strength of Gaussian-like component.

/// \param massThreshold Set PDF to zero below this threshold.

RooJohnson::RooJohnson(const char *name, const char *title,
          RooAbsReal& mass, RooAbsReal& mu, RooAbsReal& lambda,
          RooAbsReal& gamma, RooAbsReal& delta,
          double massThreshold) :
  RooAbsPdf(name,title),
  // One proxy per input; each is constructed with this PDF as its owner.
  _mass("mass", "Mass observable", this, mass),
  _mu("mu", "Location parameter of the underlying normal distribution.", this, mu),
  _lambda("lambda", "Width parameter of the underlying normal distribution (=2 lambda)", this, lambda),
  _gamma("gamma", "Shift of transformation", this, gamma),
  _delta("delta", "Scale of transformation", this, delta),
  // Plain value, not a proxy: below this mass the PDF evaluates to zero.
  _massThreshold(massThreshold)
{
  // lambda and delta are documented as strictly positive (>0), so have their
  // ranges checked against a lower limit of 0.
  RooHelpers::checkRangeOfParameters(this, {&lambda, &delta}, 0.);
}


////////////////////////////////////////////////////////////////////////////////

/// Copy a Johnson PDF.

RooJohnson::RooJohnson(const RooJohnson& other, const char* newName) :
  RooAbsPdf(other, newName),
  // Re-create every proxy with the copy as its owner, taking the state from `other`.
  // NOTE(review): the proxy names "Mass" and "mean" differ from the "mass" and "mu"
  // used by the main constructor -- confirm whether this mismatch is intentional.
  _mass("Mass", this, other._mass),
  _mu("mean", this, other._mu),
  _lambda("lambda", this, other._lambda),
  _gamma("gamma", this, other._gamma),
  _delta("delta", this, other._delta),
  _massThreshold(other._massThreshold)
{
  // Nothing else to do: all members are set up in the initialiser list.
}


////////////////////////////////////////////////////////////////////////////////


/// Evaluate the Johnson PDF at the current values of the mass and the parameters.
/// \return Zero if the mass lies below the mass threshold, otherwise
/// \f$ \frac{\delta}{\sqrt{2\pi}} \frac{1}{\lambda\sqrt{1+a^2}} \exp(-z^2/2) \f$
/// with \f$ a = (x-\mu)/\lambda \f$ and \f$ z = \gamma + \delta \sinh^{-1}(a) \f$.
double RooJohnson::evaluate() const
{
  // The PDF is defined to vanish to the left of the threshold.
  if (_mass < _massThreshold) {
    return 0.;
  }

  // Shifted and scaled observable, and the variable obtained from the transformation.
  const double scaledMass = (_mass-_mu)/_lambda;
  const double z = _gamma + _delta * asinh(scaledMass);

  // Denominator contributed by the derivative of the transformation.
  const double denominator = _lambda * sqrt(1. + scaledMass*scaledMass);

  return _delta / sqrt(TMath::TwoPi()) / denominator * exp(-0.5 * z * z);
}


////////////////////////////////////////////////////////////////////////////////


namespace {

///Actual computations for the batch evaluation of the Johnson.
///May vectorise over observables depending on types of inputs.
///\note The output and input spans are assumed to be non-overlapping. If they
///overlap, results will likely be garbage.
///\param output Span receiving one PDF value per entry; its size sets the number of iterations.
///\param mass,mu,lambda,gamma,delta Inputs that are read through `operator[]` for every index.
///\param massThreshold Entries with a mass below this value are set to zero.
template<class TMass, class TMu, class TLambda, class TGamma, class TDelta>
void compute(RooSpan<double> output, TMass mass, TMu mu, TLambda lambda, TGamma gamma,
    TDelta delta, double massThreshold) {
  const int n = output.size();

  const double sqrt_twoPi = sqrt(TMath::TwoPi());

  for (int i = 0; i < n; ++i) { //CHECK_VECTORISE
    const double arg = (mass[i] - mu[i]) / lambda[i];
    // Needed both for the inverse hyperbolic sine and for the PDF's denominator.
    const double sqrtTerm = std::sqrt(1. + arg*arg);
#ifdef R__HAS_VDT
    // asinh(x) = log(x + sqrt(x^2+1)) suffers from catastrophic cancellation for
    // negative x (and even yields log(0) for very negative x). Since asinh is odd,
    // evaluate the logarithm for |x| and restore the sign afterwards.
    const double asinh_abs = _rf_fast_log(std::abs(arg) + sqrtTerm);
    const double asinh_arg = arg < 0. ? -asinh_abs : asinh_abs;
#else
    const double asinh_arg = asinh(arg);
#endif
    const double expo = gamma[i] + delta[i] * asinh_arg;
    const double result = delta[i] / sqrt_twoPi
                                   / (lambda[i] * sqrtTerm)
                                   * _rf_fast_exp(-0.5 * expo * expo);

    // Branch-free threshold: multiply by 1 if the mass passes, by 0 otherwise.
    const double passThrough = mass[i] >= massThreshold;
    output[i] = result * passThrough;
  }
}

}


////////////////////////////////////////////////////////////////////////////////

/// Compute the Johnson \f$ S_{U} \f$ PDF in batches.
/// The local proxies {mass, mu, lambda, gamma, delta} will be searched for batch input data,
/// and if found, the computation will be batched over their
/// values. If batch data are not found for one of the proxies, the proxy's value is assumed to
/// be constant over the batch.
/// \param[in] begin Start of the batch to be computed; passed on to the proxies when retrieving batch data.
/// \param[in] maxSize Maximal size of the batches. May return smaller batches depending on inputs.
/// \return A span with the computed values.


RooSpan<double> RooJohnson::evaluateBatch(std::size_t begin, std::size_t maxSize) const {
  // Ask every proxy for batch data; an empty span means "no batch available".
  auto massData   = _mass.getValBatch(begin, maxSize);
  auto muData     = _mu.getValBatch(begin, maxSize);
  auto lambdaData = _lambda.getValBatch(begin, maxSize);
  auto gammaData  = _gamma.getValBatch(begin, maxSize);
  auto deltaData  = _delta.getValBatch(begin, maxSize);

  // Start from the size of the mass batch and shrink it to any smaller,
  // non-empty parameter batch, scanning in the order mu, lambda, gamma, delta.
  // Note that an empty mass batch therefore always results in a size of zero.
  std::size_t batchSize = massData.size();
  const auto shrinkTo = [&batchSize](std::size_t candidate) {
    if (candidate != 0 && candidate < batchSize) {
      batchSize = candidate;
    }
  };
  shrinkTo(muData.size());
  shrinkTo(lambdaData.size());
  shrinkTo(gammaData.size());
  shrinkTo(deltaData.size());
  maxSize = batchSize;

  // Nothing to compute in batch mode.
  if (maxSize == 0) {
    return {};
  }

  auto output = _batchData.makeWritableBatchUnInit(begin, maxSize);

  const bool parametersAreConstant =
      muData.empty() && lambdaData.empty() && gammaData.empty() && deltaData.empty();

  if (!massData.empty() && parametersAreConstant) {
    // Only the observable is batched: read it directly from its span and
    // present the parameters through adapters around their proxies.
    compute(output, massData, BracketAdapter<double>(_mu),
        BracketAdapter<double>(_lambda), BracketAdapter<double>(_gamma),
        BracketAdapter<double>(_delta), _massThreshold);
  }
  else {
    // General case: every input gets an adapter that is given both the proxy
    // and its (possibly empty) batch.
    compute(output,
        BracketAdapterWithMask(_mass, massData),
        BracketAdapterWithMask(_mu, muData),
        BracketAdapterWithMask(_lambda, lambdaData),
        BracketAdapterWithMask(_gamma, gammaData),
        BracketAdapterWithMask(_delta, deltaData), _massThreshold);
  }

  return output;
}


////////////////////////////////////////////////////////////////////////////////


/// Advertise which analytical integrals are supported.
/// The proxies are tried in the order mass, mu, lambda, gamma, delta, and the
/// code of the first one that matchArgs() accepts is returned.
/// \param allVars Variables over which integration is requested.
/// \param analVars Set handed to matchArgs() together with `allVars`.
/// \return One of kMass, kMean, kLambda, kGamma, kDelta, or 0 if none matches.
int RooJohnson::getAnalyticalIntegral(RooArgSet& allVars, RooArgSet& analVars, const char* /*rangeName*/) const
{
  int integralCode = 0;

  if (matchArgs(allVars, analVars, _mass)) {
    integralCode = kMass;
  } else if (matchArgs(allVars, analVars, _mu)) {
    integralCode = kMean;
  } else if (matchArgs(allVars, analVars, _lambda)) {
    integralCode = kLambda;
  } else if (matchArgs(allVars, analVars, _gamma)) {
    integralCode = kGamma;
  } else if (matchArgs(allVars, analVars, _delta)) {
    integralCode = kDelta;
  }
  //TODO write integral for others

  return integralCode;
}


////////////////////////////////////////////////////////////////////////////////


/// Compute the analytical integral for a code returned by getAnalyticalIntegral().
/// The integration limits are mapped onto the transformed variable
/// \f$ z = \gamma + \delta \sinh^{-1}((x-\mu)/\lambda) \f$, and the integral of a
/// standard normal distribution between the transformed limits is returned.
/// \param code One of kMass, kMean, kLambda, kGamma, kDelta.
/// \param rangeName Name of the range used to query the limits of the integrated variable.
/// \return The integral, or 1.E-300 if the integral evaluates to exactly zero.
double RooJohnson::analyticalIntegral(Int_t code, const char* rangeName) const
{
  //evaluate() already includes the full normalisation constant, so no
  //additional global factor has to be applied to the integral.
  const double globalNorm = 1.;

  //Here everything is scaled and shifted such that we only need to compute CDF(Gauss):
  double min = -1.E300;
  double max = 1.E300;
  if (kMass <= code && code <= kLambda) {
    double argMin, argMax;

    if (code == kMass) {
      const double upper = _mass.max(rangeName);
      double lower = _mass.min(rangeName);
      //evaluate() returns zero below the mass threshold, so the part of the
      //range to the left of the threshold must not contribute to the integral.
      if (lower < _massThreshold) {
        lower = _massThreshold < upper ? _massThreshold : upper;
      }
      argMin = (lower-_mu)/_lambda;
      argMax = (upper-_mu)/_lambda;
    } else if (code == kMean) {
      argMin = (_mass-_mu.min(rangeName))/_lambda;
      argMax = (_mass-_mu.max(rangeName))/_lambda;
    } else {
      assert(code == kLambda);
      argMin = (_mass-_mu)/_lambda.min(rangeName);
      argMax = (_mass-_mu)/_lambda.max(rangeName);
    }

    min = _gamma + _delta * asinh(argMin);
    max = _gamma + _delta * asinh(argMax);
  } else if (code == kGamma) {
    const double arg = (_mass-_mu)/_lambda;
    min = _gamma.min(rangeName) + _delta * asinh(arg);
    max = _gamma.max(rangeName) + _delta * asinh(arg);
  } else if (code == kDelta) {
    const double arg = (_mass-_mu)/_lambda;
    min = _gamma + _delta.min(rangeName) * asinh(arg);
    max = _gamma + _delta.max(rangeName) * asinh(arg);
  } else {
    assert(false);
  }
  //NOTE(review): for kLambda, kGamma and kDelta the integrand does not seem to
  //reduce to a pure Gaussian in the transformed variable (the prefactor
  //delta / (lambda * sqrt(1 + arg^2)) is not accounted for) -- verify these cases.

  //The transformed limits can come out in descending order, e.g. when integrating
  //over mu, because the transformed variable decreases with increasing mu.
  //Order them so that the integral below is never negative.
  if (min > max) {
    const double tmp = min;
    min = max;
    max = tmp;
  }

  //Here we go for maximum precision: We compute all integrals in the UPPER
  //tail of the Gaussian, because erfc has the highest precision there.
  //Therefore, the different cases for range limits in the negative hemisphere are mapped onto
  //the equivalent points in the upper hemisphere using erfc(-x) = 2. - erfc(x)
  const double ecmin = std::erfc(std::abs(min/sqrt(2.)));
  const double ecmax = std::erfc(std::abs(max/sqrt(2.)));

  const double result = 0.5 * (
      min*max < 0.0 ? 2.0 - (ecmin + ecmax)
                    : max <= 0. ? ecmax - ecmin : ecmin - ecmax
  );

  // Now, include the global norm and return. A vanishing integral is replaced
  // by a tiny positive number.
  return globalNorm * (result != 0. ? result : 1.E-300);
}


////////////////////////////////////////////////////////////////////////////////

/// Advertise which kind of direct event generation is supported.

///

/// So far, only generating mass values is supported.

Int_t RooJohnson::getGenerator(const RooArgSet& directVars, RooArgSet &generateVars, Bool_t /*staticInitOK*/) const
{
  // Code 1 stands for direct generation of the mass; 0 means that no direct
  // generator is offered. (Generation in mu is not enabled.)
  return matchArgs(directVars, generateVars, _mass) ? 1 : 0;
}


////////////////////////////////////////////////////////////////////////////////

/// Generate events based on code obtained by getGenerator().

///

/// So far, only generating mass values is supported. Others will have to be generated

/// by the slower accept/reject method.

void RooJohnson::generateEvent(Int_t code)
{
  // Only code 1 (generation of the mass) is implemented.
  if (code != 1) {
    throw std::logic_error("Generation in other variables not yet implemented.");
  }

  // Draw a standard-normal number, invert the Johnson transformation to get a
  // mass candidate, and repeat until the candidate lies inside the range of
  // the mass and not below the mass threshold.
  for (;;) {
    const double normal = RooRandom::randomGenerator()->Gaus(0., 1.);
    const double candidate = _lambda * sinh((normal - _gamma)/_delta) + _mu;

    const bool insideRange = _mass.min() <= candidate && candidate <= _mass.max();
    if (insideRange && _massThreshold <= candidate) {
      _mass = candidate;
      return;
    }
  }
}

BatchHelpers.h

r
ROOT::R::TRInterface & r
Definition: Object.C:4

RooHelpers.h

RooJohnson.h

RooRandom.h

RooVDTHeaders.h

_rf_fast_exp
double _rf_fast_exp(double x)
VDT headers for RooFit.
Definition: RooVDTHeaders.h:47

_rf_fast_log
double _rf_fast_log(double x)
Definition: RooVDTHeaders.h:51

ClassImp
#define ClassImp(name)
Definition: Rtypes.h:361

name
char name[80]
Definition: TGX11.cxx:109

TMath.h

sinh
double sinh(double)

sqrt
double sqrt(double)

exp
double exp(double)

BatchHelpers::BatchData::makeWritableBatchUnInit
RooSpan< double > makeWritableBatchUnInit(std::size_t begin, std::size_t batchSize, const RooArgSet *const normSet=nullptr, Tag_t ownerTag=kUnspecified)
Make a batch and return a span pointing to the pdf-local memory.
Definition: BatchData.cxx:118

BatchHelpers::BracketAdapterWithMask
Definition: BatchHelpers.h:81

BatchHelpers::BracketAdapter
Little adapter that gives a bracket operator to types that don't have one.
Definition: BatchHelpers.h:58

RooAbsPdf
Definition: RooAbsPdf.h:40

RooAbsReal
RooAbsReal is the common abstract base class for objects that represent a real value and implements f...
Definition: RooAbsReal.h:60

RooAbsReal::matchArgs
Bool_t matchArgs(const RooArgSet &allDeps, RooArgSet &numDeps, const RooArgProxy &a) const
Utility function for use in getAnalyticalIntegral().
Definition: RooAbsReal.cxx:3399

RooAbsReal::_batchData
BatchHelpers::BatchData _batchData
Definition: RooAbsReal.h:450

RooArgSet
RooArgSet is a container object that can hold multiple RooAbsArg objects.
Definition: RooArgSet.h:28

RooJohnson
Johnson's  distribution.
Definition: RooJohnson.h:24

RooJohnson::evaluate
Double_t evaluate() const override
Evaluate this PDF / function / constant. Needs to be overridden by all derived classes.
Definition: RooJohnson.cxx:100

RooJohnson::analyticalIntegral
Double_t analyticalIntegral(Int_t code, const char *rangeName=0) const override
Implements the actual analytical integral(s) advertised by getAnalyticalIntegral.
Definition: RooJohnson.cxx:211

RooJohnson::_mass
RooRealProxy _mass
Definition: RooJohnson.h:50

RooJohnson::kGamma
@ kGamma
Definition: RooJohnson.h:48

RooJohnson::kLambda
@ kLambda
Definition: RooJohnson.h:48

RooJohnson::kDelta
@ kDelta
Definition: RooJohnson.h:48

RooJohnson::kMean
@ kMean
Definition: RooJohnson.h:48

RooJohnson::kMass
@ kMass
Definition: RooJohnson.h:48

RooJohnson::_delta
RooRealProxy _delta
Definition: RooJohnson.h:55

RooJohnson::_gamma
RooRealProxy _gamma
Definition: RooJohnson.h:54

RooJohnson::generateEvent
void generateEvent(Int_t code) override
Generate events based on code obtained by getGenerator().
Definition: RooJohnson.cxx:289

RooJohnson::getGenerator
Int_t getGenerator(const RooArgSet &directVars, RooArgSet &generateVars, Bool_t staticInitOK=kTRUE) const override
Advertise which kind of direct event generation is supported.
Definition: RooJohnson.cxx:275

RooJohnson::evaluateBatch
RooSpan< double > evaluateBatch(std::size_t begin, std::size_t end) const override
Compute  in batches.
Definition: RooJohnson.cxx:160

RooJohnson::_mu
RooRealProxy _mu
Definition: RooJohnson.h:51

RooJohnson::_lambda
RooRealProxy _lambda
Definition: RooJohnson.h:52

RooJohnson::_massThreshold
double _massThreshold
Definition: RooJohnson.h:57

RooJohnson::RooJohnson
RooJohnson()
Definition: RooJohnson.h:26

RooJohnson::getAnalyticalIntegral
Int_t getAnalyticalIntegral(RooArgSet &allVars, RooArgSet &analVars, const char *rangeName=0) const override
Interface function getAnalyticalIntergral advertises the analytical integrals that are supported.
Definition: RooJohnson.cxx:198

RooRandom::randomGenerator
static TRandom * randomGenerator()
Return a pointer to a singleton random-number generator implementation.
Definition: RooRandom.cxx:53

RooSpan
A simple container to hold a batch of data values.
Definition: RooSpan.h:32

RooTemplateProxy::min
double min(const char *rname=0) const
Query lower limit of range. This requires the payload to be RooAbsRealLValue or derived.
Definition: RooTemplateProxy.h:286

RooTemplateProxy::max
double max(const char *rname=0) const
Query upper limit of range. This requires the payload to be RooAbsRealLValue or derived.
Definition: RooTemplateProxy.h:288

RooTemplateProxy::getValBatch
RooSpan< const typename T::value_type > getValBatch(std::size_t begin, std::size_t batchSize) const
Retrieve a batch of real or category data.
Definition: RooTemplateProxy.h:264

TRandom::Gaus
virtual Double_t Gaus(Double_t mean=0, Double_t sigma=1)
Samples a random number from the standard Normal (Gaussian) Distribution with the given mean and sigm...
Definition: TRandom.cxx:263

bool

int

ROOT::Math::erfc
double erfc(double x)
Complementary error function.
Definition: SpecFuncMathCore.cxx:44

n
const Int_t n
Definition: legend1.C:16

BatchHelpers
Definition: BatchData.h:27

ROOT::Math::Cephes::gamma
double gamma(double x)
Definition: SpecFuncCephes.cxx:339

RooHelpers::checkRangeOfParameters
void checkRangeOfParameters(const RooAbsReal *callingClass, std::initializer_list< const RooAbsReal * > pars, double min=-std::numeric_limits< double >::max(), double max=std::numeric_limits< double >::max(), bool limitsInAllowedRange=false, std::string extraMessage="")
Check if the parameters have a range, and warn if the range extends below / above the set limits.
Definition: RooHelpers.cxx:118

TGeant4Unit::gauss
static constexpr double gauss
Definition: TGeant4SystemOfUnits.h:263

TMath::TwoPi
constexpr Double_t TwoPi()
Definition: TMath.h:45

l
auto * l
Definition: textangle.C:4

output
static void output(int code)
Definition: gifencode.c:226