doc/v630/HypoTestResult_8cxx_source.html

// @(#)root/roostats:$Id$

// Author: Kyle Cranmer, Lorenzo Moneta, Gregory Schott, Wouter Verkerke, Sven Kreiss

/*************************************************************************

 * Copyright (C) 1995-2008, Rene Brun and Fons Rademakers.               *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


/*****************************************************************************

 * Project: RooStats

 * Package: RooFit/RooStats

 * @(#)root/roofit/roostats:$Id$

 * Authors:

 *   Kyle Cranmer, Lorenzo Moneta, Gregory Schott, Wouter Verkerke, Sven Kreiss

 *

 *****************************************************************************/


/** \class RooStats::HypoTestResult

    \ingroup Roostats


HypoTestResult is a base class for results from hypothesis tests.

Any tool inheriting from HypoTestCalculator can return a HypoTestResult.

As such, it stores a p-value for the null-hypothesis (eg. background-only)

and an alternate hypothesis (eg. signal+background).

The p-values can also be transformed into confidence levels

(\f$CL_{b}\f$, \f$CL_{s+b}\f$) in a trivial way.

The ratio of the \f$CL_{s+b}\f$ to \f$CL_{b}\f$ is often called

\f$CL_{s}\f$, and is considered useful, though it is not a probability.

Finally, the p-value of the null can be transformed into a number of

equivalent Gaussian sigma using the Significance method.


The p-value of the null for a given test statistic is rigorously defined and

this is the starting point for the following conventions.


### Conventions used in this class


The p-value for the null and alternate are on the **same side** of the

observed value of the test statistic. This is the more standard

convention and avoids confusion when doing inverted tests.


For exclusion, we also want the formula \f$CL_{s} = CL_{s+b} / CL_{b}\f$

to hold which therefore defines our conventions for \f$CL_{s+b}\f$ and

\f$CL_{b}\f$. \f$CL_{s}\f$ was specifically invented for exclusion

and therefore all quantities need be related through the assignments

as they are for exclusion: \f$CL_{s+b} = p_{s+b}\f$; \f$CL_{b} = p_{b}\f$. This

is derived by considering the scenarios of a powerful and not powerful

inverted test, where for the not so powerful test, \f$CL_{s}\f$ must be

close to one.


For results of Hypothesis tests,

\f$CL_{s}\f$ has no similar direct interpretation as for exclusion and can

be larger than one.


*/


#include "RooStats/HypoTestResult.h"

#include "RooStats/SamplingDistribution.h"

#include "RooAbsReal.h"


#include "RooStats/RooStatsUtils.h"


#include <TMath.h>


#include <limits>

// Quiet-NaN sentinel used in this file to mark p-values / test statistics
// that have not been set yet. Fully qualified so that the expansion does not
// depend on a using-directive being active at the point of use.
#define NaN std::numeric_limits<float>::quiet_NaN()

// Single spelling for the NaN test used throughout this file.
#define IsNaN(a) TMath::IsNaN(a)


ClassImp(RooStats::HypoTestResult);


using namespace RooStats;

using namespace std;


////////////////////////////////////////////////////////////////////////////////

/// Default constructor.
///
/// Creates an empty result: both p-values and the observed test statistic
/// start out as NaN, both p-value errors as 0, and no sampling distributions,
/// detailed outputs or test-statistic list are attached. The p-value is taken
/// from the right tail and the background is not treated as the alternate.
///
/// \param name forwarded to TNamed as both of its constructor arguments.

HypoTestResult::HypoTestResult(const char* name)
   : TNamed(name, name),
     // p-values are unknown until set explicitly or derived from toys
     fNullPValue(NaN),
     fAlternatePValue(NaN),
     fNullPValueError(0),
     fAlternatePValueError(0),
     // NaN marks "no observed test statistic yet"
     fTestStatisticData(NaN),
     fAllTestStatisticsData(nullptr),
     fNullDistr(nullptr),
     fAltDistr(nullptr),
     fNullDetailedOutput(nullptr),
     fAltDetailedOutput(nullptr),
     fPValueIsRightTail(true),
     fBackgroundIsAlt(false)
{
}


////////////////////////////////////////////////////////////////////////////////

/// Alternate constructor taking pre-computed p-values.
///
/// Identical to the default constructor except that the null and alternate
/// p-values are initialised from the arguments instead of NaN. Their errors
/// are still set to 0 and no sampling distributions are attached.
///
/// \param name  forwarded to TNamed as both of its constructor arguments.
/// \param nullp p-value stored for the null hypothesis.
/// \param altp  p-value stored for the alternate hypothesis.

HypoTestResult::HypoTestResult(const char* name, double nullp, double altp)
   : TNamed(name, name),
     fNullPValue(nullp),
     fAlternatePValue(altp),
     fNullPValueError(0),
     fAlternatePValueError(0),
     // NaN marks "no observed test statistic yet"
     fTestStatisticData(NaN),
     fAllTestStatisticsData(nullptr),
     fNullDistr(nullptr),
     fAltDistr(nullptr),
     fNullDetailedOutput(nullptr),
     fAltDetailedOutput(nullptr),
     fPValueIsRightTail(true),
     fBackgroundIsAlt(false)
{
}


////////////////////////////////////////////////////////////////////////////////

/// Copy constructor.
///
/// Scalar members (p-values, their errors, the observed test statistic and
/// the two flags) are copied directly. All owned pointers start out null and
/// are then filled by Append(), which copy-constructs the distributions,
/// detailed outputs and fit info held by `other`.
///
/// NOTE(review): fAllTestStatisticsData is left null rather than copied from
/// `other` — confirm this is intended.

HypoTestResult::HypoTestResult(const HypoTestResult& other)
   : TNamed(other),
     fNullPValue(other.fNullPValue),
     fAlternatePValue(other.fAlternatePValue),
     fNullPValueError(other.fNullPValueError),
     fAlternatePValueError(other.fAlternatePValueError),
     fTestStatisticData(other.fTestStatisticData),
     fAllTestStatisticsData(nullptr),
     fNullDistr(nullptr),
     fAltDistr(nullptr),
     fNullDetailedOutput(nullptr),
     fAltDetailedOutput(nullptr),
     fPValueIsRightTail(other.GetPValueIsRightTail()),
     fBackgroundIsAlt(other.GetBackGroundIsAlt())
{
   // Every owned pointer is null at this point, so appending amounts to
   // copying whatever `other` holds.
   Append(&other);
}


////////////////////////////////////////////////////////////////////////////////

/// Destructor.
///
/// Deletes the sampling distributions, the detailed-output datasets and the
/// list of all test statistics held through raw pointers by this object.

HypoTestResult::~HypoTestResult()
{
   // `delete` on a null pointer is a no-op, so no explicit checks are needed.
   delete fNullDistr;
   delete fAltDistr;

   delete fNullDetailedOutput;
   delete fAltDetailedOutput;

   delete fAllTestStatisticsData;
}


////////////////////////////////////////////////////////////////////////////////

/// Assignment operator.
///
/// Copies name, title, p-values, their errors, the observed test statistic
/// and the two flags from `other`. Everything this object currently owns is
/// released first; the distributions, detailed outputs and fit info are then
/// re-created from `other` through Append().
///
/// NOTE(review): fAllTestStatisticsData is cleared but not copied from
/// `other` — confirm this is intended.

HypoTestResult & HypoTestResult::operator=(const HypoTestResult& other) {
   if (this == &other) return *this;   // self-assignment: nothing to do

   SetName(other.GetName());
   SetTitle(other.GetTitle());

   fNullPValue = other.fNullPValue;
   fAlternatePValue = other.fAlternatePValue;
   fNullPValueError = other.fNullPValueError;
   fAlternatePValueError = other.fAlternatePValueError;
   fTestStatisticData = other.fTestStatisticData;

   // Drop everything currently owned so that Append() below starts from an
   // empty state and copies rather than merges.
   delete fAllTestStatisticsData;
   fAllTestStatisticsData = nullptr;

   delete fNullDistr;
   fNullDistr = nullptr;

   delete fAltDistr;
   fAltDistr = nullptr;

   delete fNullDetailedOutput;
   fNullDetailedOutput = nullptr;

   delete fAltDetailedOutput;
   fAltDetailedOutput = nullptr;

   fFitInfo.reset();

   fPValueIsRightTail = other.GetPValueIsRightTail();
   fBackgroundIsAlt = other.GetBackGroundIsAlt();

   Append(&other);

   return *this;
}


////////////////////////////////////////////////////////////////////////////////

/// Add additional toy-MC experiments to the current results.

/// Use the data test statistics of the added object if it is not already

/// set (otherwise, ignore the new one).


void HypoTestResult::Append(const HypoTestResult* other) {

   if(fNullDistr)

      fNullDistr->Add(other->GetNullDistribution());

   else

      if(other->GetNullDistribution()) fNullDistr = new SamplingDistribution( *other->GetNullDistribution() );


   if(fAltDistr)

      fAltDistr->Add(other->GetAltDistribution());

   else

      if(other->GetAltDistribution()) fAltDistr = new SamplingDistribution( *other->GetAltDistribution() );


   if( fNullDetailedOutput ) {

      if( other->GetNullDetailedOutput() ) fNullDetailedOutput->append( *other->GetNullDetailedOutput() );

   }else{

      if( other->GetNullDetailedOutput() ) fNullDetailedOutput = new RooDataSet( *other->GetNullDetailedOutput() );

   }


   if( fAltDetailedOutput ) {

      if( other->GetAltDetailedOutput() ) fAltDetailedOutput->append( *other->GetAltDetailedOutput() );

   }else{

      if( other->GetAltDetailedOutput() ) fAltDetailedOutput = new RooDataSet( *other->GetAltDetailedOutput() );

   }


   if( fFitInfo ) {

      if( other->GetFitInfo() ) fFitInfo->append( *other->GetFitInfo() );

   }else{

      if( other->GetFitInfo() ) fFitInfo = std::make_unique<RooDataSet>( *other->GetFitInfo());

   }


   // if no data is present use the other HypoTestResult's data

   if(IsNaN(fTestStatisticData)) fTestStatisticData = other->GetTestStatisticData();


   UpdatePValue(fNullDistr, fNullPValue, fNullPValueError, true);

   UpdatePValue(fAltDistr, fAlternatePValue, fAlternatePValueError, false);

}


////////////////////////////////////////////////////////////////////////////////


/// Store `alt` as the alternate-hypothesis sampling distribution and refresh
/// the alternate p-value and its error from it.
///
/// The pointer previously stored is overwritten without being deleted. Since
/// the destructor deletes the stored pointer, this object presumably takes
/// over ownership of `alt` — NOTE(review): confirm who is responsible for a
/// previously set distribution.

void HypoTestResult::SetAltDistribution(SamplingDistribution *alt) {
   fAltDistr = alt;

   // No-op when `alt` is null or no test statistic has been set yet.
   UpdatePValue(alt, fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


/// Store `null` as the null-hypothesis sampling distribution and refresh the
/// null p-value and its error from it.
///
/// The pointer previously stored is overwritten without being deleted. Since
/// the destructor deletes the stored pointer, this object presumably takes
/// over ownership of `null` — NOTE(review): confirm who is responsible for a
/// previously set distribution.

void HypoTestResult::SetNullDistribution(SamplingDistribution *null) {
   fNullDistr = null;

   // No-op when `null` is a null pointer or no test statistic has been set yet.
   UpdatePValue(null, fNullPValue, fNullPValueError, true);
}


////////////////////////////////////////////////////////////////////////////////


/// Set the value of the test statistic evaluated on data and recompute both
/// p-values from the sampling distributions that are currently attached.
///
/// \param tsd observed test-statistic value.

void HypoTestResult::SetTestStatisticData(const double tsd) {
   fTestStatisticData = tsd;

   // Each call is a no-op if the corresponding distribution is missing
   // (or if `tsd` itself is NaN).
   UpdatePValue(fNullDistr, fNullPValue, fNullPValueError, true);
   UpdatePValue(fAltDistr, fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


void HypoTestResult::SetAllTestStatisticsData(const RooArgList* tsd) {

   if (fAllTestStatisticsData) {

      delete fAllTestStatisticsData;

      fAllTestStatisticsData = nullptr;

   }

   if (tsd) fAllTestStatisticsData = (const RooArgList*)tsd->snapshot();


   if( fAllTestStatisticsData  &&  fAllTestStatisticsData->getSize() > 0 ) {

      RooRealVar* firstTS = (RooRealVar*)fAllTestStatisticsData->at(0);

      if( firstTS ) SetTestStatisticData( firstTS->getVal() );

   }

}


////////////////////////////////////////////////////////////////////////////////


/// Choose which tail of the sampling distributions defines the p-values and
/// recompute both p-values accordingly.
///
/// \param pr true to integrate from the observed test statistic upwards,
///           false to integrate up to the observed test statistic.

void HypoTestResult::SetPValueIsRightTail(bool pr) {
   fPValueIsRightTail = pr;

   // The integration range depends on the flag, so both values are refreshed.
   UpdatePValue(fNullDistr, fNullPValue, fNullPValueError, true);
   UpdatePValue(fAltDistr, fAlternatePValue, fAlternatePValueError, false);
}


////////////////////////////////////////////////////////////////////////////////


/// Tell whether an observed test-statistic value is available, i.e. whether
/// the stored value is something other than NaN.

bool HypoTestResult::HasTestStatisticData(void) const {
   const bool unset = IsNaN(fTestStatisticData);
   return !unset;
}


////////////////////////////////////////////////////////////////////////////////


/// Returns the error on the null p-value.
double HypoTestResult::NullPValueError() const {

   // Nothing is computed here: this returns the stored member as is.

   return fNullPValueError;

}


////////////////////////////////////////////////////////////////////////////////

/// Error on \f$CL_{b}\f$.
///
/// Returns the error of the p-value that belongs to the background
/// hypothesis: the alternate p-value error when the background is the
/// alternate, the null p-value error otherwise. This is the opposite
/// selection to the one made in CLsplusbError().

double HypoTestResult::CLbError() const {
   if (fBackgroundIsAlt) return fAlternatePValueError;
   return fNullPValueError;
}


////////////////////////////////////////////////////////////////////////////////


/// Error on \f$CL_{s+b}\f$.
///
/// Returns the null p-value error when the background is the alternate, and
/// the alternate p-value error otherwise. This is the opposite selection to
/// the one made in CLbError().

double HypoTestResult::CLsplusbError() const {
   if (fBackgroundIsAlt) return fNullPValueError;
   return fAlternatePValueError;
}


////////////////////////////////////////////////////////////////////////////////

/// Error on the significance, obtained by error propagation (Taylor expansion
/// approximation): the null p-value error divided by the standard normal
/// density evaluated at the significance.

double HypoTestResult::SignificanceError() const {
   const double densityAtZ = ROOT::Math::normal_pdf(Significance());
   return NullPValueError() / densityAtZ;
}


////////////////////////////////////////////////////////////////////////////////

/// Returns an estimate of the error on \f$CL_{s}\f$ through combination of the

/// errors on \f$CL_{b}\f$ and \f$CL_{s+b}\f$:

/// \f[

/// \sigma_{CL_s} = CL_s

/// \sqrt{\left( \frac{\sigma_{CL_{s+b}}}{CL_{s+b}} \right)^2 + \left( \frac{\sigma_{CL_{b}}}{CL_{b}} \right)^2}

/// \f]


double HypoTestResult::CLsError() const {

   if(!fAltDistr || !fNullDistr) return 0.0;


   // unsigned const int n_b = fNullDistr->GetSamplingDistribution().size();

   // unsigned const int n_sb = fAltDistr->GetSamplingDistribution().size();


   // if CLb() == 0 CLs = -1 so return a -1 error

   if (CLb() == 0 ) return -1;


   double cl_b_err2 = pow(CLbError(),2);

   double cl_sb_err2 = pow(CLsplusbError(),2);


   return TMath::Sqrt(cl_sb_err2 + cl_b_err2 * pow(CLs(),2))/CLb();

}


////////////////////////////////////////////////////////////////////////////////

/// Updates a p-value (and its error) from a sampling distribution, provided
/// sufficient data is available.
///
/// Nothing happens if no observed test statistic has been set (it is NaN) or
/// if `distr` is null. Otherwise the normalised integral of `distr` over the
/// selected tail is written to `pvalue` and its error to `perror`.
///
/// \param distr  sampling distribution to integrate; may be null.
/// \param pvalue receives the integral.
/// \param perror receives the error on the integral.
///
/// The last (unnamed) bool argument is not used.

void HypoTestResult::UpdatePValue(const SamplingDistribution* distr, double &pvalue, double &perror, bool /*isNull*/) {
   if (!distr || IsNaN(fTestStatisticData)) return;

   /* Got to be careful for discrete distributions:
    * To get the right behaviour for limits, the p-value must
    * include the value of fTestStatistic both for Alt and Null cases,
    * hence both interval ends are always closed:
    *   right tail: [ fTestStatistic, inf ]
    *   left tail:  [ -inf, fTestStatistic ]
    */
   const double lowEdge = fPValueIsRightTail ? fTestStatisticData : -RooNumber::infinity();
   const double highEdge = fPValueIsRightTail ? RooNumber::infinity() : fTestStatisticData;

   pvalue = distr->IntegralAndError(perror, lowEdge, highEdge,
                                    true,   // normalize
                                    true,   // low edge closed
                                    true);  // high edge closed
}


////////////////////////////////////////////////////////////////////////////////

/// Print out some information about the results to standard output.
///
/// Note: use Alt/Null labels for the hypotheses here as the Null
/// might be the s+b hypothesis.
///
/// The "+/-" error columns are printed only when at least one sampling
/// distribution is attached; the test-statistic line only when an observed
/// value has been set. The option argument is ignored.

void HypoTestResult::Print(Option_t * ) const
{
   auto &out = std::cout;

   // Errors are only shown when at least one toy distribution is present.
   const bool haveToys = (fAltDistr || fNullDistr);

   out << std::endl << "Results " << GetName() << ": " << std::endl;

   out << " - Null p-value = " << NullPValue();
   if (haveToys) {
      out << " +/- " << NullPValueError();
   }
   out << std::endl;

   out << " - Significance = " << Significance();
   if (haveToys) {
      out << " +/- " << SignificanceError() << " sigma";
   }
   out << std::endl;

   if (fAltDistr) {
      out << " - Number of Alt toys: " << fAltDistr->GetSize() << std::endl;
   }
   if (fNullDistr) {
      out << " - Number of Null toys: " << fNullDistr->GetSize() << std::endl;
   }

   if (HasTestStatisticData()) {
      out << " - Test statistic evaluated on data: " << fTestStatisticData << std::endl;
   }

   out << " - CL_b: " << CLb();
   if (haveToys) {
      out << " +/- " << CLbError();
   }
   out << std::endl;

   out << " - CL_s+b: " << CLsplusb();
   if (haveToys) {
      out << " +/- " << CLsplusbError();
   }
   out << std::endl;

   out << " - CL_s: " << CLs();
   if (haveToys) {
      out << " +/- " << CLsError();
   }
   out << std::endl;
}

NaN
#define NaN
Definition HypoTestResult.cxx:68

IsNaN
#define IsNaN(a)
Definition HypoTestResult.cxx:69

HypoTestResult.h

RooAbsReal.h

NaN
#define NaN
Definition RooLagrangianMorphFunc.cxx:86

RooStatsUtils.h

Option_t
const char Option_t
Definition RtypesCore.h:66

ClassImp
#define ClassImp(name)
Definition Rtypes.h:377

SamplingDistribution.h

name
char name[80]
Definition TGX11.cxx:110

TMath.h

RooAbsCollection::snapshot
RooAbsCollection * snapshot(bool deepCopy=true) const
Take a snap shot of current collection contents.
Definition RooAbsCollection.cxx:220

RooAbsCollection::getSize
Int_t getSize() const
Return the number of elements in the collection.
Definition RooAbsCollection.h:281

RooAbsReal::getVal
double getVal(const RooArgSet *normalisationSet=nullptr) const
Evaluate object.
Definition RooAbsReal.h:103

RooArgList
RooArgList is a container object that can hold multiple RooAbsArg objects.
Definition RooArgList.h:22

RooArgList::at
RooAbsArg * at(Int_t idx) const
Return object at given index, or nullptr if index is out of range.
Definition RooArgList.h:110

RooDataSet
RooDataSet is a container class to hold unbinned data.
Definition RooDataSet.h:57

RooDataSet::append
void append(RooDataSet &data)
Add all data points of given data set to this data set.
Definition RooDataSet.cxx:1272

RooNumber::infinity
static constexpr double infinity()
Return internal infinity representation.
Definition RooNumber.h:25

RooRealVar
RooRealVar represents a variable that can be changed from the outside.
Definition RooRealVar.h:37

RooStats::HypoTestResult
HypoTestResult is a base class for results from hypothesis tests.
Definition HypoTestResult.h:22

RooStats::HypoTestResult::GetFitInfo
RooDataSet * GetFitInfo() const
Definition HypoTestResult.h:74

RooStats::HypoTestResult::fAltDetailedOutput
RooDataSet * fAltDetailedOutput
Definition HypoTestResult.h:130

RooStats::HypoTestResult::UpdatePValue
void UpdatePValue(const SamplingDistribution *distr, double &pvalue, double &perror, bool pIsRightTail)
updates the pvalue if sufficient data is available
Definition HypoTestResult.cxx:318

RooStats::HypoTestResult::Print
void Print(const Option_t *="") const override
Print out some information about the results Note: use Alt/Null labels for the hypotheses here as the...
Definition HypoTestResult.cxx:341

RooStats::HypoTestResult::fPValueIsRightTail
bool fPValueIsRightTail
Definition HypoTestResult.h:132

RooStats::HypoTestResult::fNullPValue
double fNullPValue
p-value for the null hypothesis (small number means disfavoured)
Definition HypoTestResult.h:121

RooStats::HypoTestResult::HasTestStatisticData
bool HasTestStatisticData(void) const
Definition HypoTestResult.cxx:259

RooStats::HypoTestResult::fAlternatePValueError
double fAlternatePValueError
error of p-value for the alternate hypothesis (small number means disfavoured)
Definition HypoTestResult.h:124

RooStats::HypoTestResult::operator=
HypoTestResult & operator=(const HypoTestResult &other)
assignment operator
Definition HypoTestResult.cxx:142

RooStats::HypoTestResult::CLsplusb
virtual double CLsplusb() const
Convert AlternatePValue into a "confidence level".
Definition HypoTestResult.h:54

RooStats::HypoTestResult::SetAllTestStatisticsData
void SetAllTestStatisticsData(const RooArgList *tsd)
Definition HypoTestResult.cxx:235

RooStats::HypoTestResult::GetTestStatisticData
double GetTestStatisticData(void) const
Definition HypoTestResult.h:75

RooStats::HypoTestResult::Append
virtual void Append(const HypoTestResult *other)
add values from another HypoTestResult
Definition HypoTestResult.cxx:173

RooStats::HypoTestResult::NullPValueError
double NullPValueError() const
The error on the Null p-value.
Definition HypoTestResult.cxx:265

RooStats::HypoTestResult::CLsError
double CLsError() const
The error on the ratio \f$CL_{s+b}/CL_{b}\f$.
Definition HypoTestResult.cxx:300

RooStats::HypoTestResult::GetNullDetailedOutput
RooDataSet * GetNullDetailedOutput(void) const
Definition HypoTestResult.h:72

RooStats::HypoTestResult::Significance
virtual double Significance() const
familiar name for the Null p-value in terms of 1-sided Gaussian significance
Definition HypoTestResult.h:68

RooStats::HypoTestResult::fNullDetailedOutput
RooDataSet * fNullDetailedOutput
Definition HypoTestResult.h:129

RooStats::HypoTestResult::fAltDistr
SamplingDistribution * fAltDistr
Definition HypoTestResult.h:128

RooStats::HypoTestResult::GetPValueIsRightTail
bool GetPValueIsRightTail(void) const
Definition HypoTestResult.h:92

RooStats::HypoTestResult::fBackgroundIsAlt
bool fBackgroundIsAlt
Definition HypoTestResult.h:133

RooStats::HypoTestResult::SetNullDistribution
void SetNullDistribution(SamplingDistribution *null)
Definition HypoTestResult.cxx:219

RooStats::HypoTestResult::~HypoTestResult
~HypoTestResult() override
destructor
Definition HypoTestResult.cxx:128

RooStats::HypoTestResult::GetBackGroundIsAlt
bool GetBackGroundIsAlt(void) const
Definition HypoTestResult.h:95

RooStats::HypoTestResult::HypoTestResult
HypoTestResult(const char *name=nullptr)
default constructor
Definition HypoTestResult.cxx:79

RooStats::HypoTestResult::SignificanceError
double SignificanceError() const
The error on the significance, computed from NullPValueError via error propagation.
Definition HypoTestResult.cxx:288

RooStats::HypoTestResult::NullPValue
virtual double NullPValue() const
Return p-value for null hypothesis.
Definition HypoTestResult.h:45

RooStats::HypoTestResult::CLbError
double CLbError() const
The error on the "confidence level" of the null hypothesis.
Definition HypoTestResult.cxx:275

RooStats::HypoTestResult::SetTestStatisticData
void SetTestStatisticData(const double tsd)
Definition HypoTestResult.cxx:226

RooStats::HypoTestResult::CLsplusbError
double CLsplusbError() const
The error on the "confidence level" of the alternative hypothesis.
Definition HypoTestResult.cxx:281

RooStats::HypoTestResult::fNullPValueError
double fNullPValueError
error of p-value for the null hypothesis (small number means disfavoured)
Definition HypoTestResult.h:123

RooStats::HypoTestResult::fTestStatisticData
double fTestStatisticData
result of the test statistic evaluated on data
Definition HypoTestResult.h:125

RooStats::HypoTestResult::SetAltDistribution
void SetAltDistribution(SamplingDistribution *alt)
Definition HypoTestResult.cxx:212

RooStats::HypoTestResult::SetPValueIsRightTail
void SetPValueIsRightTail(bool pr)
Definition HypoTestResult.cxx:250

RooStats::HypoTestResult::GetAltDetailedOutput
RooDataSet * GetAltDetailedOutput(void) const
Definition HypoTestResult.h:73

RooStats::HypoTestResult::fAllTestStatisticsData
const RooArgList * fAllTestStatisticsData
for the case of multiple test statistics, holds all the results
Definition HypoTestResult.h:126

RooStats::HypoTestResult::GetNullDistribution
SamplingDistribution * GetNullDistribution(void) const
Definition HypoTestResult.h:70

RooStats::HypoTestResult::fFitInfo
std::unique_ptr< RooDataSet > fFitInfo
Definition HypoTestResult.h:131

RooStats::HypoTestResult::CLs
virtual double CLs() const
\f$CL_{s}\f$ is simply \f$CL_{s+b}/CL_{b}\f$ (not a method, but a quantity)
Definition HypoTestResult.h:57

RooStats::HypoTestResult::fAlternatePValue
double fAlternatePValue
p-value for the alternate hypothesis (small number means disfavoured)
Definition HypoTestResult.h:122

RooStats::HypoTestResult::CLb
virtual double CLb() const
Convert NullPValue into a "confidence level".
Definition HypoTestResult.h:51

RooStats::HypoTestResult::fNullDistr
SamplingDistribution * fNullDistr
Definition HypoTestResult.h:127

RooStats::HypoTestResult::GetAltDistribution
SamplingDistribution * GetAltDistribution(void) const
Definition HypoTestResult.h:71

RooStats::SamplingDistribution
This class simply holds a sampling distribution of some test statistic.
Definition SamplingDistribution.h:28

RooStats::SamplingDistribution::GetSize
Int_t GetSize() const
size of samples
Definition SamplingDistribution.h:62

RooStats::SamplingDistribution::IntegralAndError
double IntegralAndError(double &error, double low, double high, bool normalize=true, bool lowClosed=true, bool highClosed=false) const
numerical integral in these limits including error estimation
Definition SamplingDistribution.cxx:238

RooStats::SamplingDistribution::Add
void Add(const SamplingDistribution *other)
merge two sampling distributions
Definition SamplingDistribution.cxx:153

TNamed
The TNamed class is the base class for all named ROOT classes.
Definition TNamed.h:29

TNamed::SetTitle
virtual void SetTitle(const char *title="")
Set the title of the TNamed.
Definition TNamed.cxx:164

TNamed::GetName
const char * GetName() const override
Returns name of object.
Definition TNamed.h:47

TNamed::GetTitle
const char * GetTitle() const override
Returns title of object.
Definition TNamed.h:48

TNamed::SetName
virtual void SetName(const char *name)
Set the name of the TNamed.
Definition TNamed.cxx:140

ROOT::Math::normal_pdf
double normal_pdf(double x, double sigma=1, double x0=0)
Probability density function of the normal (Gaussian) distribution.
Definition PdfFuncMathCore.h:509

RooStats
Namespace for the RooStats classes.
Definition Asimov.h:19

TMath::Sqrt
Double_t Sqrt(Double_t x)
Returns the square root of x.
Definition TMath.h:662