doc/v624/RooNLLVar_8cxx_source.html

/*****************************************************************************

 * Project: RooFit                                                           *

 * Package: RooFitCore                                                       *

 * @(#)root/roofitcore:$Id$

 * Authors:                                                                  *

 *   WV, Wouter Verkerke, UC Santa Barbara, verkerke@slac.stanford.edu       *

 *   DK, David Kirkby,    UC Irvine,         dkirkby@uci.edu                 *

 *                                                                           *

 * Copyright (c) 2000-2005, Regents of the University of California          *

 *                          and Stanford University. All rights reserved.    *

 *                                                                           *

 * Redistribution and use in source and binary forms,                        *

 * with or without modification, are permitted according to the terms        *

 * listed in LICENSE (http://roofit.sourceforge.net/license.txt)             *

 *****************************************************************************/


/**

\file RooNLLVar.cxx

\class RooNLLVar

\ingroup Roofitcore


Class RooNLLVar implements a -log(likelihood) calculation from a dataset

and a PDF. The NLL is calculated as

\f[

 \sum_\mathrm{data} -\log( \mathrm{pdf}(x_\mathrm{data}))

\f]

In extended mode, a

\f$ N_\mathrm{expect} - N_\mathrm{observed} \cdot \log(N_\mathrm{expect}) \f$ term is added.

**/


#include "RooNLLVar.h"

#include "RooAbsData.h"
#include "RooAbsPdf.h"
#include "RooCmdConfig.h"
#include "RooMsgService.h"
#include "RooAbsDataStore.h"
#include "RooRealMPFE.h"
#include "RooRealSumPdf.h"
#include "RooRealVar.h"
#include "RooProdPdf.h"
#include "RooNaNPacker.h"
#include "RunContext.h"

#ifdef ROOFIT_CHECK_CACHED_VALUES
#include <iomanip>
#endif

#include "TMath.h"
#include "Math/Util.h"

#include <algorithm>
#include <memory>


// Expands the ClassImp macro (defined in Rtypes.h) for this class.
ClassImp(RooNLLVar)


// Definition of the static member. Its address is passed as the default value
// when decoding "ProjectedObservables" in the RooCmdArg-based constructor.
RooArgSet RooNLLVar::_emptySet ;


/// Default constructor. Performs no explicit initialisation of its own.
RooNLLVar::RooNLLVar() = default;


////////////////////////////////////////////////////////////////////////////////
/// Build the likelihood for a p.d.f. and a (binned or unbinned) dataset, with the
/// configuration given as up to nine RooCmdArg named arguments.
///
/// The base class is configured by decoding the arguments on the fly; the
/// remaining options ("Extended", "BatchMode") are parsed in the constructor body.
///
///  Argument                 | Description
///  -------------------------|------------
///  Extended()               | Include extended term in calculation
///  NumCPU()                 | Activate parallel processing feature
///  Range()                  | Fit only selected region
///  SumCoefRange()           | Set the range in which to interpret the coefficients of RooAddPdf components
///  SplitRange()             | Fit range is split by index category of simultaneous PDF
///  ConditionalObservables() | Define conditional observables
///  Verbose()                | Verbose output of GOF framework classes
///  CloneData()              | Clone input dataset for internal use (default is kTRUE)
///  BatchMode()              | Evaluate batches of data events (faster if PDFs support it)
///  IntegrateBins()          | Integrate PDF within each bin. This sets the desired precision. Only useful for binned fits.
RooNLLVar::RooNLLVar(const char *name, const char* title, RooAbsPdf& pdf, RooAbsData& indata,
           const RooCmdArg& arg1, const RooCmdArg& arg2,const RooCmdArg& arg3,
           const RooCmdArg& arg4, const RooCmdArg& arg5,const RooCmdArg& arg6,
           const RooCmdArg& arg7, const RooCmdArg& arg8,const RooCmdArg& arg9) :
  RooAbsOptTestStatistic(name,title,pdf,indata,
          *(const RooArgSet*)RooCmdConfig::decodeObjOnTheFly("RooNLLVar::RooNLLVar","ProjectedObservables",0,&_emptySet
                               ,arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9),
          RooCmdConfig::decodeStringOnTheFly("RooNLLVar::RooNLLVar","RangeWithName",0,"",arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9).c_str(),
          RooCmdConfig::decodeStringOnTheFly("RooNLLVar::RooNLLVar","AddCoefRange",0,"",arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9).c_str(),
          RooCmdConfig::decodeIntOnTheFly("RooNLLVar::RooNLLVar","NumCPU",0,1,arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9),
          RooFit::BulkPartition,
          RooCmdConfig::decodeIntOnTheFly("RooNLLVar::RooNLLVar","Verbose",0,1,arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9),
          RooCmdConfig::decodeIntOnTheFly("RooNLLVar::RooNLLVar","SplitRange",0,0,arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9),
          RooCmdConfig::decodeIntOnTheFly("RooNLLVar::RooNLLVar","CloneData",0,1,arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9),
          RooCmdConfig::decodeDoubleOnTheFly("RooNLLVar::RooNLLVar", "IntegrateBins", 0, -1., {arg1,arg2,arg3,arg4,arg5,arg6,arg7,arg8,arg9}))
{
  // Parser for the options that are not consumed by the base-class initialiser.
  // Unknown arguments are tolerated because the base class handles the others.
  RooCmdConfig cmdParser("RooNLLVar::RooNLLVar");
  cmdParser.allowUndefined();
  cmdParser.defineInt("extended", "Extended", 0, kFALSE);
  cmdParser.defineInt("BatchMode", "BatchMode", 0, false);

  // Feed the arguments to the parser in their positional order.
  const RooCmdArg* const cmdArgs[] = {&arg1, &arg2, &arg3, &arg4, &arg5, &arg6, &arg7, &arg8, &arg9};
  for (const RooCmdArg* cmd : cmdArgs) {
    cmdParser.process(*cmd);
  }

  // Options taken from the parsed arguments.
  _extended = cmdParser.getInt("extended");
  _batchEvaluations = cmdParser.getInt("BatchMode");

  // Fixed start-up state.
  _weightSq = kFALSE;
  _first = kTRUE;
  _binnedPdf = 0;

  // Likelihood offsets (current and the copies kept for weights-squared mode) start at zero.
  _offset = 0.;
  _offsetCarry = 0.;
  _offsetSaveW2 = 0.;
  _offsetCarrySaveW2 = 0.;
}


////////////////////////////////////////////////////////////////////////////////
/// Construct likelihood from given p.d.f and (binned or unbinned dataset)
/// For internal use.
///
/// This overload passes an empty RooArgSet as projected observables to the
/// base class.
///
/// \param[in] extended Stored in `_extended`; enables the extended likelihood term.
/// \param[in] binnedL  If true, the cloned function is treated as a RooRealSumPdf and
///                     a binned likelihood is set up. Binned mode is switched off again
///                     (`_binnedPdf` reset to null) unless the function depends on
///                     exactly one observable of the dataset.
/// \param[in] integrateBinsPrecision Forwarded unchanged to RooAbsOptTestStatistic.
///
/// All other parameters are forwarded unchanged to RooAbsOptTestStatistic.

RooNLLVar::RooNLLVar(const char *name, const char *title, RooAbsPdf& pdf, RooAbsData& indata,
           Bool_t extended, const char* rangeName, const char* addCoefRangeName,
           Int_t nCPU, RooFit::MPSplit interleave, Bool_t verbose, Bool_t splitRange, Bool_t cloneData, Bool_t binnedL,
           double integrateBinsPrecision) :
  RooAbsOptTestStatistic(name,title,pdf,indata,RooArgSet(),rangeName,addCoefRangeName,nCPU,interleave,verbose,splitRange,cloneData,
      integrateBinsPrecision),
  _extended(extended),
  _weightSq(kFALSE),
  _first(kTRUE), _offsetSaveW2(0.), _offsetCarrySaveW2(0.)
{
  // If binned likelihood flag is set, pdf is a RooRealSumPdf representing a yield vector
  // for a binned likelihood calculation
  _binnedPdf = binnedL ? (RooRealSumPdf*)_funcClone : 0 ;

  // Retrieve and cache bin widths needed to convert un-normalized binnedPdf values back to yields
  if (_binnedPdf) {

    // The Active label will disable pdf integral calculations
    _binnedPdf->setAttribute("BinnedLikelihoodActive") ;

    // getObservables() hands ownership of the returned set to the caller. Holding it
    // in a unique_ptr releases it on every path (it used to be leaked).
    std::unique_ptr<RooArgSet> obs{_funcClone->getObservables(_dataClone)} ;
    if (obs->getSize()!=1) {
      _binnedPdf = 0 ;
    } else {
      RooRealVar* var = (RooRealVar*) obs->first() ;

      // The boundary list is heap-allocated for the caller as well; own it here so it
      // is freed once the widths have been cached (it used to be leaked).
      // NOTE(review): the result is dereferenced without a null/empty check, as before -
      // confirm binBoundaries() always yields at least one boundary here.
      std::unique_ptr<std::list<Double_t>> boundaries{_binnedPdf->binBoundaries(*var,var->getMin(),var->getMax())} ;

      // N boundaries delimit N-1 bins; width = upper boundary - lower boundary.
      _binw.resize(boundaries->size()-1) ;
      std::list<Double_t>::iterator biter = boundaries->begin() ;
      Double_t lastBound = (*biter) ;
      ++biter ;
      for (int ibin=0 ; biter!=boundaries->end() ; ++biter, ++ibin) {
        _binw[ibin] = (*biter) - lastBound ;
        lastBound = (*biter) ;
      }
    }
  }
}


////////////////////////////////////////////////////////////////////////////////
/// Construct likelihood from given p.d.f and (binned or unbinned dataset)
/// For internal use.
///
/// Same as the overload without `projDeps`, except that the projected observables
/// are supplied by the caller.
///
/// \param[in] projDeps Projected observables, forwarded to RooAbsOptTestStatistic.
/// \param[in] extended Stored in `_extended`; enables the extended likelihood term.
/// \param[in] binnedL  If true, the cloned function is treated as a RooRealSumPdf and
///                     a binned likelihood is set up. Binned mode is switched off again
///                     (`_binnedPdf` reset to null) unless the function depends on
///                     exactly one observable of the dataset.
/// \param[in] integrateBinsPrecision Forwarded unchanged to RooAbsOptTestStatistic.
///
/// All other parameters are forwarded unchanged to RooAbsOptTestStatistic.

RooNLLVar::RooNLLVar(const char *name, const char *title, RooAbsPdf& pdf, RooAbsData& indata,
           const RooArgSet& projDeps, Bool_t extended, const char* rangeName,const char* addCoefRangeName,
           Int_t nCPU,RooFit::MPSplit interleave,Bool_t verbose, Bool_t splitRange, Bool_t cloneData, Bool_t binnedL,
           double integrateBinsPrecision) :
  RooAbsOptTestStatistic(name,title,pdf,indata,projDeps,rangeName,addCoefRangeName,nCPU,interleave,verbose,splitRange,cloneData,
      integrateBinsPrecision),
  _extended(extended),
  _weightSq(kFALSE),
  _first(kTRUE), _offsetSaveW2(0.), _offsetCarrySaveW2(0.)
{
  // If binned likelihood flag is set, pdf is a RooRealSumPdf representing a yield vector
  // for a binned likelihood calculation
  _binnedPdf = binnedL ? (RooRealSumPdf*)_funcClone : 0 ;

  // Retrieve and cache bin widths needed to convert un-normalized binnedPdf values back to yields
  if (_binnedPdf) {

    // NOTE(review): unlike the overload without projDeps, the "BinnedLikelihoodActive"
    // attribute is not set here - confirm whether that difference is intended.

    // getObservables() hands ownership of the returned set to the caller. Holding it
    // in a unique_ptr releases it on every path (it used to be leaked).
    std::unique_ptr<RooArgSet> obs{_funcClone->getObservables(_dataClone)} ;
    if (obs->getSize()!=1) {
      _binnedPdf = 0 ;
    } else {
      RooRealVar* var = (RooRealVar*) obs->first() ;

      // The boundary list is heap-allocated for the caller as well; own it here so it
      // is freed once the widths have been cached (it used to be leaked).
      // NOTE(review): the result is dereferenced without a null/empty check, as before -
      // confirm binBoundaries() always yields at least one boundary here.
      std::unique_ptr<std::list<Double_t>> boundaries{_binnedPdf->binBoundaries(*var,var->getMin(),var->getMax())} ;

      // N boundaries delimit N-1 bins; width = upper boundary - lower boundary.
      _binw.resize(boundaries->size()-1) ;
      std::list<Double_t>::iterator biter = boundaries->begin() ;
      Double_t lastBound = (*biter) ;
      ++biter ;
      for (int ibin=0 ; biter!=boundaries->end() ; ++biter, ++ibin) {
        _binw[ibin] = (*biter) - lastBound ;
        lastBound = (*biter) ;
      }
    }
  }
}


////////////////////////////////////////////////////////////////////////////////
/// Copy constructor.
///
/// Copies the configuration flags, the saved weights-squared offsets and the cached
/// bin widths from `other`. `_first` is reset to true for the copy. If `other` was in
/// binned mode, `_binnedPdf` is pointed at this object's own function clone.

RooNLLVar::RooNLLVar(const RooNLLVar& other, const char* name) :
  RooAbsOptTestStatistic(other,name),
  _extended(other._extended),
  _batchEvaluations(other._batchEvaluations),
  _weightSq(other._weightSq),
  _first(kTRUE),
  _offsetSaveW2(other._offsetSaveW2),
  _offsetCarrySaveW2(other._offsetCarrySaveW2),
  _binw(other._binw)
{
  if (other._binnedPdf) {
    _binnedPdf = static_cast<RooRealSumPdf*>(_funcClone);
  } else {
    _binnedPdf = nullptr;
  }
}


////////////////////////////////////////////////////////////////////////////////
/// Create a test statistic using several properties of the current instance. This is used to duplicate
/// the test statistic in multi-processing scenarios.
///
/// The new object takes its extended flag, bin-integration precision and batch mode
/// from this instance; the extended flag is only kept if the p.d.f. can be extended.
/// The new object is constructed with `cloneData = false`.
///
/// \param[in] pdf Must refer to a RooAbsPdf; the reference dynamic_cast throws
///            std::bad_cast otherwise.
/// \return Newly allocated RooNLLVar; the caller receives the raw pointer.
RooAbsTestStatistic* RooNLLVar::create(const char *name, const char *title, RooAbsReal& pdf, RooAbsData& adata,
            const RooArgSet& projDeps, const char* rangeName, const char* addCoefRangeName,
            Int_t nCPU, RooFit::MPSplit interleave, bool verbose, bool splitRange, bool binnedL) {
  RooAbsPdf& asPdf = dynamic_cast<RooAbsPdf&>(pdf);

  // Only request the extended term if this instance uses it and the p.d.f. supports it.
  const bool useExtendedTerm = _extended && asPdf.canBeExtended();

  RooNLLVar* duplicate = new RooNLLVar(name, title, asPdf, adata, projDeps, useExtendedTerm,
                                       rangeName, addCoefRangeName, nCPU, interleave, verbose, splitRange,
                                       false, binnedL, _integrateBinsPrecision);
  duplicate->batchMode(_batchEvaluations);
  return duplicate;
}


////////////////////////////////////////////////////////////////////////////////
/// Destructor. Nothing is released explicitly here.

RooNLLVar::~RooNLLVar() = default;


////////////////////////////////////////////////////////////////////////////////
/// Switch the use of squared event weights on or off.
///
/// - Slave: if the flag changes, store it and exchange the current offset and its
///   carry with the copies saved for the other weighting mode. The value is marked
///   dirty in any case.
/// - MPMaster: forward the flag to each of the `_nCPU` entries of `_mpfeArray`.
/// - SimMaster: forward the flag to each of the `_nGof` entries of `_gofArray`.
///
/// Any other operation mode is left untouched.

void RooNLLVar::applyWeightSquared(Bool_t flag)
{
  switch (_gofOpMode) {
    case Slave:
      if (_weightSq != flag) {
        _weightSq = flag;
        std::swap(_offset, _offsetSaveW2);
        std::swap(_offsetCarry, _offsetCarrySaveW2);
      }
      setValueDirty();
      break;

    case MPMaster:
      for (Int_t iCpu = 0; iCpu < _nCPU; ++iCpu) {
        _mpfeArray[iCpu]->applyNLLWeightSquared(flag);
      }
      break;

    case SimMaster:
      for (Int_t iGof = 0; iGof < _nGof; ++iGof) {
        static_cast<RooNLLVar*>(_gofArray[iGof])->applyWeightSquared(flag);
      }
      break;

    default:
      break;
  }
}


////////////////////////////////////////////////////////////////////////////////

/// Calculate and return likelihood on subset of data.

/// \param[in] firstEvent First event to be processed.

/// \param[in] lastEvent  First event that is not processed any more (exclusive upper bound).

/// \param[in] stepSize   Steps between events.

/// \note For batch computations, the step size **must** be one.

///

/// If this is an extended likelihood, the extended term is added to the returned likelihood

/// by the partition for which `_setNum == _extSet` (unbinned branch only).

///

/// The carry of the compensated summation is stored in `_evalCarry`. If offsetting is

/// enabled (`_doOffset`), the first non-zero result is stored as the offset and the

/// offset is subtracted from the returned value.


Double_t RooNLLVar::evaluatePartition(std::size_t firstEvent, std::size_t lastEvent, std::size_t stepSize) const

{

  // Throughout the calculation, we use Kahan's algorithm for summing to

  // prevent loss of precision - this is a factor four more expensive than

  // straight addition, but since evaluating the PDF is usually much more

  // expensive than that, we tolerate the additional cost...

  double result(0), carry(0), sumWeight(0);


  RooAbsPdf* pdfClone = (RooAbsPdf*) _funcClone ;


  // cout << "RooNLLVar::evaluatePartition(" << GetName() << ") projDeps = " << (_projDeps?*_projDeps:RooArgSet()) << endl ;


  // Refresh the data store's cache for this partition. The last argument is false in binned mode, true otherwise.
  _dataClone->store()->recalculateCache( _projDeps, firstEvent, lastEvent, stepSize, (_binnedPdf?kFALSE:kTRUE) ) ;


  // If pdf is marked as binned - do a binned likelihood calculation here (sum of log-Poisson for each bin)

  if (_binnedPdf) {

    double sumWeightCarry = 0.;

    for (auto i=firstEvent ; i<lastEvent ; i+=stepSize) {


      // Load entry i; its weight is read below as the observed count of this bin.
      _dataClone->get(i) ;


      if (!_dataClone->valid()) continue;


      Double_t eventWeight = _dataClone->weight();


      // Calculate log(Poisson(N|mu)) for this bin

      Double_t N = eventWeight ;

      // Expected yield: function value times the cached width of bin i.
      Double_t mu = _binnedPdf->getVal()*_binw[i] ;

      //cout << "RooNLLVar::binnedL(" << GetName() << ") N=" << N << " mu = " << mu << endl ;


      if (mu<=0 && N>0) {


        // Catch error condition: data present where zero events are predicted

        logEvalError(Form("Observed %f events in bin %lu with zero event yield",N,(unsigned long)i)) ;


      } else if (fabs(mu)<1e-10 && fabs(N)<1e-10) {


        // Special handling of this case: log(Poisson(0|0)) = 0, but it cannot be calculated with the

        // usual log-formula because log(mu) diverges for mu = 0. No update of result is required since term=0.


      } else {


        // Negative log of the Poisson probability: mu - N*log(mu) + ln(Gamma(N+1)).
        Double_t term = -1*(-mu + N*log(mu) - TMath::LnGamma(N+1)) ;


        // TODO replace by Math::KahanSum

        // Kahan summation of sumWeight (only bins reaching this branch contribute)

        Double_t y = eventWeight - sumWeightCarry;

        Double_t t = sumWeight + y;

        sumWeightCarry = (t - sumWeight) - y;

        sumWeight = t;


        // Kahan summation of result

        y = term - carry;

        t = result + y;

        carry = (t - result) - y;

        result = t;

      }

    }


  } else { //unbinned PDF


    if (_batchEvaluations) {

      std::tie(result, carry, sumWeight) = computeBatched(stepSize, firstEvent, lastEvent);

#ifdef ROOFIT_CHECK_CACHED_VALUES


      // Debug cross-check: repeat the computation with the scalar interface and report deviations on stderr.
      double resultScalar, carryScalar, sumWeightScalar;

      std::tie(resultScalar, carryScalar, sumWeightScalar) =

          computeScalar(stepSize, firstEvent, lastEvent);


      constexpr bool alwaysPrint = false;


      if (alwaysPrint || fabs(result - resultScalar)/resultScalar > 5.E-15) {

        std::cerr << "RooNLLVar: result is off\n\t" << std::setprecision(15) << result

            << "\n\t" << resultScalar << std::endl;

      }


      if (alwaysPrint || fabs(carry - carryScalar)/carryScalar > 500.) {

        std::cerr << "RooNLLVar: carry is far off\n\t" << std::setprecision(15) << carry

            << "\n\t" << carryScalar << std::endl;

      }


      if (alwaysPrint || fabs(sumWeight - sumWeightScalar)/sumWeightScalar > 1.E-15) {

        std::cerr << "RooNLLVar: sumWeight is off\n\t" << std::setprecision(15) << sumWeight

            << "\n\t" << sumWeightScalar << std::endl;

      }


#endif

    } else { //scalar mode

      std::tie(result, carry, sumWeight) = computeScalar(stepSize, firstEvent, lastEvent);

    }


    // include the extended maximum likelihood term, if requested

    // (only the partition whose set number equals _extSet adds it)

    if(_extended && _setNum==_extSet) {

      if (_weightSq) {


        // TODO Batch this up

        // Calculate sum of weights-squared here for extended term

        // (runs over all entries of the dataset, not only over this partition)

        Double_t sumW2(0), sumW2carry(0);

        for (decltype(_dataClone->numEntries()) i = 0; i < _dataClone->numEntries() ; i++) {

          _dataClone->get(i);

          Double_t y = _dataClone->weightSquared() - sumW2carry;

          Double_t t = sumW2 + y;

          sumW2carry = (t - sumW2) - y;

          sumW2 = t;

        }


        Double_t expected= pdfClone->expectedEvents(_dataClone->get());


        // Adjust calculation of extended term with W^2 weighting: adjust poisson such that

        // estimate of Nexpected stays at the same value, but has a different variance, rescale

        // both the observed and expected count of the Poisson with a factor sum[w] / sum[w^2] which is

        // the effective weight of the Poisson term.

        // i.e. change Poisson(Nobs = sum[w]| Nexp ) --> Poisson( sum[w] * sum[w] / sum[w^2] | Nexp * sum[w] / sum[w^2] )

        // weighted by the effective weight  sum[w^2]/ sum[w] in the likelihood.

        // Since here we compute the likelihood with the weight square we need to multiply by the

        // square of the effective weight

        // expectedW = expected * sum[w] / sum[w^2]   : effective expected entries

        // observedW =  sum[w]  * sum[w] / sum[w^2]   : effective observed entries

        // The extended term for the likelihood weighted by the square of the weight will be then:

        //  (sum[w^2]/ sum[w] )^2 * expectedW -  (sum[w^2]/ sum[w] )^2 * observedW * log (expectedW)  and this is

        //  using the previous expressions for expectedW and observedW

        //  sum[w^2] / sum[w] * expected - sum[w^2] * log (expectedW)

        //  and since the weights are constants in the likelihood we can use log(expected) instead of log(expectedW)


        Double_t expectedW2 = expected * sumW2 / _dataClone->sumEntries() ;

        Double_t extra= expectedW2 - sumW2*log(expected );


        // Double_t y = pdfClone->extendedTerm(sumW2, _dataClone->get()) - carry;


        // Kahan-add the weights-squared extended term to the result.
        Double_t y = extra - carry ;


        Double_t t = result + y;

        carry = (t - result) - y;

        result = t;

      } else {

        // Kahan-add the extended term provided by the p.d.f. for the summed weights of the dataset.
        Double_t y = pdfClone->extendedTerm(_dataClone->sumEntries(), _dataClone->get()) - carry;

        Double_t t = result + y;

        carry = (t - result) - y;

        result = t;

      }

    }

  } //unbinned PDF


  // If part of simultaneous PDF normalize probability over

  // number of simultaneous PDFs: -sum(log(p/n)) = -sum(log(p)) + N*log(n)

  if (_simCount>1) {

    Double_t y = sumWeight*log(1.0*_simCount) - carry;

    Double_t t = result + y;

    carry = (t - result) - y;

    result = t;

  }


  // At the end of the first full calculation, wire the caches

  if (_first) {

    _first = kFALSE ;

    _funcClone->wireAllCaches() ;

  }


  // Check if value offset flag is set.

  if (_doOffset) {


    // If no offset is stored enable this feature now

    // (the first non-zero result and its carry become the offset)

    if (_offset==0 && result !=0 ) {

      coutI(Minimization) << "RooNLLVar::evaluatePartition(" << GetName() << ") first = "<< firstEvent << " last = " << lastEvent << " Likelihood offset now set to " << result << std::endl ;

      _offset = result ;

      _offsetCarry = carry;

    }


    // Subtract offset

    Double_t y = -_offset - (carry + _offsetCarry);

    Double_t t = result + y;

    carry = (t - result) - y;

    result = t;

  }


  // Store the final carry in _evalCarry alongside the returned sum.
  _evalCarry = carry;

  return result ;

}


////////////////////////////////////////////////////////////////////////////////

/// Compute probabilites of all data events. Use faster batch interface.

/// \param[in] stepSize Stride when moving through the dataset.

///   \note For batch computations, the step size **must** be one.

/// \param[in] firstEvent  First event to be processed.

/// \param[in] lastEvent   First event not to be processed.

/// \return Tuple with (Kahan sum of probabilities, carry of kahan sum, sum of weights)

std::tuple<double, double, double> RooNLLVar::computeBatched(std::size_t stepSize, std::size_t firstEvent, std::size_t lastEvent) const

{

  const auto nEvents = lastEvent - firstEvent;


  if (stepSize != 1) {

    throw std::invalid_argument(std::string("Error in ") + __FILE__ + ": Step size for batch computations can only be 1.");

  }


  auto pdfClone = static_cast<const RooAbsPdf*>(_funcClone);


  // Create a RunContext that will own the memory where computation results are stored.

  // Holding on to this struct in between function calls will make sure that the memory

  // is only allocated once.

  if (!_evalData) {

    _evalData.reset(new RooBatchCompute::RunContext);

  }

  _evalData->clear();

  _dataClone->getBatches(*_evalData, firstEvent, nEvents);


  auto results = pdfClone->getLogProbabilities(*_evalData, _normSet);


#ifdef ROOFIT_CHECK_CACHED_VALUES


  for (std::size_t evtNo = firstEvent; evtNo < std::min(lastEvent, firstEvent + 10); ++evtNo) {

    _dataClone->get(evtNo);

    assert(_dataClone->valid());

    try {

      // Cross check results with strict tolerance and complain

      BatchInterfaceAccessor::checkBatchComputation(*pdfClone, *_evalData, evtNo-firstEvent, _normSet, 1.E-13);

    } catch (std::exception& e) {

      std::cerr << __FILE__ << ":" << __LINE__ << " ERROR when checking batch computation for event " << evtNo << ":\n"

          << e.what() << std::endl;


      // It becomes a real problem if it's very wrong. We fail in this case:

      try {

        BatchInterfaceAccessor::checkBatchComputation(*pdfClone, *_evalData, evtNo-firstEvent, _normSet, 1.E-9);

      } catch (std::exception& e2) {

        assert(false);

      }

    }

  }


#endif


  // Compute sum of event weights. First check if we need squared weights

  const RooSpan<const double> eventWeights = _dataClone->getWeightBatch(firstEvent, nEvents);

  //Capture member for lambda:

  const bool retrieveSquaredWeights = _weightSq;

  auto retrieveWeight = [&eventWeights, retrieveSquaredWeights](std::size_t i) {

    return retrieveSquaredWeights ? eventWeights[i] * eventWeights[i] : eventWeights[i];

  };


  //Sum the event weights and probabilities

  ROOT::Math::KahanSum<double, 4u> kahanProb;

  double uniformSingleEventWeight{0.0};

  double sumOfWeights;

  if (eventWeights.empty()) {

    uniformSingleEventWeight = retrieveSquaredWeights ? _dataClone->weightSquared() : _dataClone->weight();

    sumOfWeights = nEvents * uniformSingleEventWeight;

    for (std::size_t i = 0; i < results.size(); ++i) { //CHECK_VECTORISE

      kahanProb.AddIndexed(-uniformSingleEventWeight * results[i], i);

    }

  } else {

    assert(results.size() == eventWeights.size());

    ROOT::Math::KahanSum<double, 4u> kahanWeight;

    for (std::size_t i = 0; i < results.size(); ++i) { //CHECK_VECTORISE

      const double weight = retrieveWeight(i);

      kahanProb.AddIndexed(-weight * results[i], i);

      kahanWeight.AddIndexed(weight, i);

    }

    sumOfWeights = kahanWeight.Sum();

  }


  if (std::isnan(kahanProb.Sum())) {

    // Special handling of evaluation errors.

    // We can recover if the bin/event that results in NaN has a weight of zero:

    ROOT::Math::KahanSum<double, 4u> kahanSanitised;

    RooNaNPacker nanPacker;

    for (std::size_t i = 0; i < results.size(); ++i) {

      double weight = eventWeights.empty() ? uniformSingleEventWeight : retrieveWeight(i);


      if (weight == 0.)

        continue;


      if (std::isnan(results[i])) {

        nanPacker.accumulate(results[i]);

      } else {

        kahanSanitised += -weight * results[i];

      }

    }


    // Some events with evaluation errors. Return "badness" of errors.

    if (nanPacker.getPayload() > 0.) {

      return std::tuple<double, double, double>{nanPacker.getNaNWithPayload(), 0., sumOfWeights};

    } else {

      return std::tuple<double, double, double>{kahanSanitised.Sum(), kahanSanitised.Carry(), sumOfWeights};

    }

  }


  return std::tuple<double, double, double>{kahanProb.Sum(), kahanProb.Carry(), sumOfWeights};

}


std::tuple<double, double, double> RooNLLVar::computeScalar(std::size_t stepSize, std::size_t firstEvent, std::size_t lastEvent) const {

  auto pdfClone = static_cast<const RooAbsPdf*>(_funcClone);


  ROOT::Math::KahanSum<double> kahanWeight;

  ROOT::Math::KahanSum<double> kahanProb;

  RooNaNPacker packedNaN(0.f);


  for (auto i=firstEvent; i<lastEvent; i+=stepSize) {

    _dataClone->get(i) ;


    if (!_dataClone->valid()) continue;


    Double_t eventWeight = _dataClone->weight(); //FIXME

    if (0. == eventWeight * eventWeight) continue ;

    if (_weightSq) eventWeight = _dataClone->weightSquared() ;


    const double term = -eventWeight * pdfClone->getLogVal(_normSet);


    kahanWeight.Add(eventWeight);

    kahanProb.Add(term);

    packedNaN.accumulate(term);

  }


  if (packedNaN.getPayload() != 0.) {

    // Some events with evaluation errors. Return "badness" of errors.

    return std::tuple<double, double, double>{packedNaN.getNaNWithPayload(), 0., kahanWeight.Sum()};

  }


  return std::tuple<double, double, double>{kahanProb.Sum(), kahanProb.Carry(), kahanWeight.Sum()};

}

e
#define e(i)
Definition RSha256.hxx:103

RooAbsDataStore.h

RooAbsData.h

RooAbsPdf.h

RooCmdConfig.h

RooMsgService.h

coutI
#define coutI(a)
Definition RooMsgService.h:30

RooNLLVar.h

RooNaNPacker.h

RooProdPdf.h

RooRealMPFE.h

RooRealSumPdf.h

RooRealVar.h

kFALSE
const Bool_t kFALSE
Definition RtypesCore.h:92

Double_t
double Double_t
Definition RtypesCore.h:59

kTRUE
const Bool_t kTRUE
Definition RtypesCore.h:91

ClassImp
#define ClassImp(name)
Definition Rtypes.h:364

RunContext.h

N
#define N

name
char name[80]
Definition TGX11.cxx:110

TMath.h

log
double log(double)

Form
char * Form(const char *fmt,...)

Util.h

BatchInterfaceAccessor::checkBatchComputation
static void checkBatchComputation(const RooAbsReal &theReal, const RooBatchCompute::RunContext &evalData, std::size_t evtNo, const RooArgSet *normSet=nullptr, double relAccuracy=1.E-13)
Definition RooAbsReal.h:586

ROOT::Math::KahanSum
The Kahan summation is a compensated summation algorithm, which significantly reduces numerical error...
Definition Util.h:122

ROOT::Math::KahanSum::Sum
T Sum() const
Definition Util.h:208

ROOT::Math::KahanSum::Carry
T Carry() const
Definition Util.h:223

ROOT::Math::KahanSum::AddIndexed
void AddIndexed(T input, std::size_t index)
Add input to the sum.
Definition Util.h:199

ROOT::Math::KahanSum::Add
void Add(T x)
Single-element accumulation. Will not vectorise.
Definition Util.h:133

RooAbsArg::getObservables
RooArgSet * getObservables(const RooArgSet &set, Bool_t valueOnly=kTRUE) const
Given a set of possible observables, return the observables that this PDF depends on.
Definition RooAbsArg.h:313

RooAbsArg::setAttribute
void setAttribute(const Text_t *name, Bool_t value=kTRUE)
Set (default) or clear a named boolean attribute of this object.
Definition RooAbsArg.cxx:292

RooAbsArg::wireAllCaches
void wireAllCaches()
Definition RooAbsArg.cxx:2297

RooAbsArg::setValueDirty
void setValueDirty()
Mark the element dirty. This forces a re-evaluation when a value is requested.
Definition RooAbsArg.h:508

RooAbsCollection::getSize
Int_t getSize() const
Definition RooAbsCollection.h:182

RooAbsCollection::first
RooAbsArg * first() const
Definition RooAbsCollection.h:187

RooAbsDataStore::recalculateCache
virtual void recalculateCache(const RooArgSet *, Int_t, Int_t, Int_t, Bool_t)
Definition RooAbsDataStore.h:111

RooAbsData
RooAbsData is the common abstract base class for binned and unbinned datasets.
Definition RooAbsData.h:49

RooAbsData::get
virtual const RooArgSet * get() const
Definition RooAbsData.h:92

RooAbsData::store
RooAbsDataStore * store()
Definition RooAbsData.h:68

RooAbsData::getBatches
virtual void getBatches(RooBatchCompute::RunContext &evalData, std::size_t first=0, std::size_t len=std::numeric_limits< std::size_t >::max()) const =0
Retrieve batches of data for each real-valued variable in this dataset.

RooAbsData::getWeightBatch
virtual RooSpan< const double > getWeightBatch(std::size_t first, std::size_t len) const =0
Return event weights of all events in range [first, first+len).

RooAbsData::sumEntries
virtual Double_t sumEntries() const =0
Return effective number of entries in dataset, i.e., sum all weights.

RooAbsData::valid
virtual Bool_t valid() const
Definition RooAbsData.h:98

RooAbsData::weight
virtual Double_t weight() const =0

RooAbsData::weightSquared
virtual Double_t weightSquared() const =0

RooAbsData::numEntries
virtual Int_t numEntries() const
Return number of entries in dataset, i.e., count unweighted entries.
Definition RooAbsData.cxx:307

RooAbsOptTestStatistic
RooAbsOptTestStatistic is the abstract base class for test statistics objects that evaluate a functio...
Definition RooAbsOptTestStatistic.h:28

RooAbsOptTestStatistic::_funcClone
RooAbsReal * _funcClone
Definition RooAbsOptTestStatistic.h:81

RooAbsOptTestStatistic::_normSet
RooArgSet * _normSet
Definition RooAbsOptTestStatistic.h:78

RooAbsOptTestStatistic::_dataClone
RooAbsData * _dataClone
Definition RooAbsOptTestStatistic.h:80

RooAbsOptTestStatistic::_integrateBinsPrecision
double _integrateBinsPrecision
Definition RooAbsOptTestStatistic.h:92

RooAbsOptTestStatistic::_projDeps
RooArgSet * _projDeps
Definition RooAbsOptTestStatistic.h:82

RooAbsPdf
Definition RooAbsPdf.h:43

RooAbsPdf::canBeExtended
Bool_t canBeExtended() const
If true, PDF can provide extended likelihood term.
Definition RooAbsPdf.h:238

RooAbsPdf::extendedTerm
virtual Double_t extendedTerm(Double_t observedEvents, const RooArgSet *nset=0) const
Return the extended likelihood term ( ) of this PDF for the given number of observed events.
Definition RooAbsPdf.cxx:779

RooAbsPdf::expectedEvents
virtual Double_t expectedEvents(const RooArgSet *nset) const
Return expected number of events from this p.d.f for use in extended likelihood calculations.
Definition RooAbsPdf.cxx:3319

RooAbsRealLValue::getMax
virtual Double_t getMax(const char *name=0) const
Get maximum of currently defined range.
Definition RooAbsRealLValue.h:89

RooAbsRealLValue::getMin
virtual Double_t getMin(const char *name=0) const
Get miniminum of currently defined range.
Definition RooAbsRealLValue.h:86

RooAbsReal
RooAbsReal is the common abstract base class for objects that represent a real value and implements f...
Definition RooAbsReal.h:61

RooAbsReal::getVal
Double_t getVal(const RooArgSet *normalisationSet=nullptr) const
Evaluate object.
Definition RooAbsReal.h:91

RooAbsReal::logEvalError
void logEvalError(const char *message, const char *serverValueString=0) const
Log evaluation error message.
Definition RooAbsReal.cxx:3731

RooAbsTestStatistic
RooAbsTestStatistic is the abstract base class for all test statistics.
Definition RooAbsTestStatistic.h:37

RooAbsTestStatistic::_setNum
Int_t _setNum
Definition RooAbsTestStatistic.h:130

RooAbsTestStatistic::_nGof
Int_t _nGof
Number of designated set to calculated extended term.
Definition RooAbsTestStatistic.h:135

RooAbsTestStatistic::_nCPU
Int_t _nCPU
GOF MP Split mode specified by component (when Auto is active)
Definition RooAbsTestStatistic.h:140

RooAbsTestStatistic::_doOffset
Bool_t _doOffset
Definition RooAbsTestStatistic.h:144

RooAbsTestStatistic::_offset
Double_t _offset
Definition RooAbsTestStatistic.h:145

RooAbsTestStatistic::_gofArray
pRooAbsTestStatistic * _gofArray
Definition RooAbsTestStatistic.h:136

RooAbsTestStatistic::_gofOpMode
GOFOpMode _gofOpMode
Is object initialized
Definition RooAbsTestStatistic.h:127

RooAbsTestStatistic::_simCount
Int_t _simCount
Definition RooAbsTestStatistic.h:112

RooAbsTestStatistic::Slave
@ Slave
Definition RooAbsTestStatistic.h:99

RooAbsTestStatistic::MPMaster
@ MPMaster
Definition RooAbsTestStatistic.h:99

RooAbsTestStatistic::SimMaster
@ SimMaster
Definition RooAbsTestStatistic.h:99

RooAbsTestStatistic::_extSet
Int_t _extSet
Definition RooAbsTestStatistic.h:132

RooAbsTestStatistic::_evalCarry
Double_t _evalCarry
avoids loss of precision
Definition RooAbsTestStatistic.h:147

RooAbsTestStatistic::_mpfeArray
pRooRealMPFE * _mpfeArray
Definition RooAbsTestStatistic.h:141

RooAbsTestStatistic::_offsetCarry
Double_t _offsetCarry
Offset.
Definition RooAbsTestStatistic.h:146

RooArgSet
RooArgSet is a container object that can hold multiple RooAbsArg objects.
Definition RooArgSet.h:29

RooCmdArg
RooCmdArg is a named container for two doubles, two integers two object points and three string point...
Definition RooCmdArg.h:27

RooCmdConfig
Class RooCmdConfig is a configurable parser for RooCmdArg named arguments.
Definition RooCmdConfig.h:27

RooNLLVar
Class RooNLLVar implements a -log(likelihood) calculation from a dataset and a PDF.
Definition RooNLLVar.h:30

RooNLLVar::applyWeightSquared
void applyWeightSquared(Bool_t flag)
Definition RooNLLVar.cxx:250

RooNLLVar::RooNLLVar
RooNLLVar()
Definition RooNLLVar.cxx:58

RooNLLVar::_binnedPdf
RooRealSumPdf * _binnedPdf
Definition RooNLLVar.h:89

RooNLLVar::create
virtual RooAbsTestStatistic * create(const char *name, const char *title, RooAbsReal &pdf, RooAbsData &adata, const RooArgSet &projDeps, const char *rangeName, const char *addCoefRangeName=0, Int_t nCPU=1, RooFit::MPSplit interleave=RooFit::BulkPartition, Bool_t verbose=kTRUE, Bool_t splitRange=kFALSE, Bool_t binnedL=kFALSE)
Create a test statistic using several properties of the current instance.
Definition RooNLLVar.cxx:224

RooNLLVar::_extended
Bool_t _extended
Definition RooNLLVar.h:81

RooNLLVar::_batchEvaluations
bool _batchEvaluations
Definition RooNLLVar.h:82

RooNLLVar::_emptySet
static RooArgSet _emptySet
Definition RooNLLVar.h:72

RooNLLVar::~RooNLLVar
virtual ~RooNLLVar()
Destructor.
Definition RooNLLVar.cxx:241

RooNLLVar::_first
Bool_t _first
Definition RooNLLVar.h:84

RooNLLVar::_binw
std::vector< Double_t > _binw
Definition RooNLLVar.h:88

RooNLLVar::_offsetCarrySaveW2
Double_t _offsetCarrySaveW2
Definition RooNLLVar.h:86

RooNLLVar::evaluatePartition
virtual Double_t evaluatePartition(std::size_t firstEvent, std::size_t lastEvent, std::size_t stepSize) const
Calculate and return likelihood on subset of data.
Definition RooNLLVar.cxx:279

RooNLLVar::_offsetSaveW2
Double_t _offsetSaveW2
Definition RooNLLVar.h:85

RooNLLVar::computeBatched
std::tuple< double, double, double > computeBatched(std::size_t stepSize, std::size_t firstEvent, std::size_t lastEvent) const
Compute probabilities of all data events.
Definition RooNLLVar.cxx:474

RooNLLVar::computeScalar
std::tuple< double, double, double > computeScalar(std::size_t stepSize, std::size_t firstEvent, std::size_t lastEvent) const
Definition RooNLLVar.cxx:578

RooNLLVar::_evalData
std::unique_ptr< RooBatchCompute::RunContext > _evalData
Definition RooNLLVar.h:90

RooNLLVar::_weightSq
Bool_t _weightSq
Definition RooNLLVar.h:83

RooRealSumPdf
The class RooRealSumPdf implements a PDF constructed from a sum of functions:
Definition RooRealSumPdf.h:25

RooRealSumPdf::binBoundaries
virtual std::list< Double_t > * binBoundaries(RooAbsRealLValue &, Double_t, Double_t) const
Retrieve bin boundaries if this distribution is binned in obs.
Definition RooRealSumPdf.cxx:468

RooRealVar
RooRealVar represents a variable that can be changed from the outside.
Definition RooRealVar.h:39

RooSpan
A simple container to hold a batch of data values.
Definition RooSpan.h:34

RooSpan::size
constexpr std::span< T >::index_type size() const noexcept
Definition RooSpan.h:121

RooSpan::empty
constexpr bool empty() const noexcept
Definition RooSpan.h:125

TNamed::GetName
virtual const char * GetName() const
Returns name of object.
Definition TNamed.h:47

bool

int

y
Double_t y[n]
Definition legend1.C:17

RooFit
The namespace RooFit contains mostly switches that change the behaviour of functions of PDFs (or othe...
Definition RooCFunction1Binding.h:29

RooFit::MPSplit
MPSplit
Definition RooGlobalFunc.h:70

TMath::LnGamma
Double_t LnGamma(Double_t z)
Computation of ln[gamma(z)] for all z.
Definition TMath.cxx:486

RooBatchCompute::RunContext
This struct enables passing computation data around between elements of a computation graph.
Definition RunContext.h:31

RooNaNPacker
Little struct that can pack a float into the unused bits of the mantissa of a NaN double.
Definition RooNaNPacker.h:28

RooNaNPacker::getPayload
float getPayload() const
Retrieve packed float.
Definition RooNaNPacker.h:85

RooNaNPacker::getNaNWithPayload
double getNaNWithPayload() const
Retrieve a NaN with the current float payload packed into the mantissa.
Definition RooNaNPacker.h:90

RooNaNPacker::accumulate
void accumulate(double val)
Accumulate a packed float from another NaN into this.
Definition RooNaNPacker.h:57