doc/v614/LDA_8cxx_source.html

 // $Id$
 /**********************************************************************************
  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *
  * Package: TMVA                                                                  *
  * Class  : LDA                                                                   *
  * Web    : http://tmva.sourceforge.net                                           *
  *                                                                                *
  * Description:                                                                   *
  *      Local LDA method used by MethodKNN to compute MVA value.                  *
  *      This is experimental code under development. This class computes          *
  *      parameters of signal and background PDFs using Gaussian approximation.    *
  *                                                                                *
  * Author:                                                                        *
  *      John Alison John.Alison@cern.ch - University of Pennsylvania, USA         *
  *                                                                                *
  * Copyright (c) 2007:                                                            *
  *      CERN, Switzerland                                                         *
  *      MPI-K Heidelberg, Germany                                                 *
  *      University of Pennsylvania, USA                                           *
  *                                                                                *
  * Redistribution and use in source and binary forms, with or without             *
  * modification, are permitted according to the terms listed in LICENSE           *
  * (http://tmva.sourceforge.net/LICENSE)                                          *
  **********************************************************************************/

 /*! \class TMVA::LDA
 \ingroup TMVA

 */

 // Local
 #include "TMVA/LDA.h"

 // C/C++
 #include <iostream>

 #include "TDecompSVD.h"
 #include "TMatrixF.h"
 #include "TMath.h"

 #include "TMVA/Types.h"
 #include "TMVA/MsgLogger.h"

 /////////////////////////////////////////////////////////////////////////////////
 /// constructor
 ///
 /// \param[in] tolerence  lower bound applied to the singular values of the
 ///                       covariance matrix when it is inverted in Initialize()
 /// \param[in] debug      enables the additional debug printout of this class
 ///
 /// fSigma and fSigmaInverse start out as null pointers and the number of
 /// parameters as zero.

 TMVA::LDA::LDA( Float_t tolerence, Bool_t debug )
    : fTolerence(tolerence),
      fNumParams(0),
      fSigma(0),
      fSigmaInverse(0),
      fDebug(debug),
      // The second MsgLogger argument is the minimum message level that gets
      // printed: kDEBUG messages must pass only when debugging was requested.
      fLogger( new MsgLogger("LDA", (debug ? kDEBUG : kINFO)) )
 {
 }

 ////////////////////////////////////////////////////////////////////////////////
 /// destructor
 ///
 /// Releases the matrices and the logger owned by this object. fSigma is
 /// allocated with new in Initialize(); deleting a pointer that is still null
 /// is a no-op, so no explicit checks are needed.

 TMVA::LDA::~LDA()
 {
    delete fSigma;
    delete fSigmaInverse;
    delete fLogger;
 }

 ////////////////////////////////////////////////////////////////////////////////
 /// Create LDA matrix using local events found by knn method

 void TMVA::LDA::Initialize(const LDAEvents& inputSignalEvents, const LDAEvents& inputBackgroundEvents)
 {
    Log() << kDEBUG << "There are: " << inputSignalEvents.size() << " input signal events " << Endl;
    Log() << kDEBUG << "There are: " << inputBackgroundEvents.size() << " input background events " << Endl;

    fNumParams = inputSignalEvents[0].size();

    UInt_t numSignalEvents = inputSignalEvents.size();
    UInt_t numBackEvents  = inputBackgroundEvents.size();
    UInt_t numTotalEvents = numSignalEvents + numBackEvents;
    fEventFraction[0] = (Float_t)numBackEvents/numTotalEvents;
    fEventFraction[1] = (Float_t)numSignalEvents/numTotalEvents;
    UInt_t K = 2;

    // get the mean of the signal and background for each parameter
    std::vector<Float_t> m_muSignal (fNumParams,0.0);
    std::vector<Float_t> m_muBackground (fNumParams,0.0);
    for (UInt_t param=0; param < fNumParams; ++param) {
       for (UInt_t eventNumber=0; eventNumber < numSignalEvents; ++eventNumber)
          m_muSignal[param] += inputSignalEvents[eventNumber][param];
       for (UInt_t eventNumber=0; eventNumber < numBackEvents; ++eventNumber)
          m_muBackground[param] += inputBackgroundEvents[eventNumber][param]/numBackEvents;
       if (numSignalEvents > 0) m_muSignal[param] /= numSignalEvents;
       if (numBackEvents > 0 )  m_muBackground[param] /= numBackEvents;
    }
    fMu[0] = m_muBackground;
    fMu[1] = m_muSignal;

    if (fDebug) {
       Log() << kDEBUG << "the signal means" << Endl;
       for (UInt_t param=0; param < fNumParams; ++param)
          Log() << kDEBUG << m_muSignal[param] << Endl;
       Log() << kDEBUG << "the background means" << Endl;
       for (UInt_t param=0; param < inputBackgroundEvents[0].size(); ++param)
          Log() << kDEBUG << m_muBackground[param] << Endl;
    }

    // sigma is a sum of two symmetric matrices, one for the background and one for signal
    // get the matrices separately (def not be the best way to do it!)

    // the signal, background, and total matrix
    TMatrixF sigmaSignal(fNumParams, fNumParams);
    TMatrixF sigmaBack(fNumParams, fNumParams);
    if (fSigma!=0) delete fSigma;
    fSigma = new TMatrixF(fNumParams, fNumParams);
    for (UInt_t row=0; row < fNumParams; ++row) {
       for (UInt_t col=0; col < fNumParams; ++col) {
          sigmaSignal[row][col] = 0;
          sigmaBack[row][col] = 0;
          (*fSigma)[row][col] = 0;
       }
    }

    for (UInt_t eventNumber=0; eventNumber < numSignalEvents; ++eventNumber) {
       for (UInt_t row=0; row < fNumParams; ++row) {
          for (UInt_t col=0; col < fNumParams; ++col) {
             sigmaSignal[row][col] += (inputSignalEvents[eventNumber][row] - m_muSignal[row]) * (inputSignalEvents[eventNumber][col] - m_muSignal[col] );
          }
       }
    }

    for (UInt_t eventNumber=0; eventNumber < numBackEvents; ++eventNumber) {
       for (UInt_t row=0; row < fNumParams; ++row) {
          for (UInt_t col=0; col < fNumParams; ++col) {
             sigmaBack[row][col] += (inputBackgroundEvents[eventNumber][row] - m_muBackground[row]) * (inputBackgroundEvents[eventNumber][col] - m_muBackground[col] );
          }
       }
    }

    // the total matrix
    *fSigma = sigmaBack + sigmaSignal;
    *fSigma *= 1.0/(numTotalEvents - K);

    if (fDebug) {
       Log() << "after filling sigmaSignal" <<Endl;
       sigmaSignal.Print();
       Log() << "after filling sigmaBack" <<Endl;
       sigmaBack.Print();
       Log() << "after filling total Sigma" <<Endl;
       fSigma->Print();
    }

    TDecompSVD solutionSVD = TDecompSVD( *fSigma );
    TMatrixF   decomposed  = TMatrixF( fNumParams, fNumParams );
    TMatrixF diag  ( fNumParams, fNumParams );
    TMatrixF uTrans( fNumParams, fNumParams );
    TMatrixF vTrans( fNumParams, fNumParams );
    if (solutionSVD.Decompose()) {
       for (UInt_t i = 0; i< fNumParams; ++i) {
          if (solutionSVD.GetSig()[i] > fTolerence)
             diag(i,i) = solutionSVD.GetSig()[i];
          else
             diag(i,i) = fTolerence;
       }

       if (fDebug) {
          Log() << "the diagonal" <<Endl;
          diag.Print();
       }

       decomposed = solutionSVD.GetV();
       decomposed *= diag;
       decomposed *= solutionSVD.GetU();

       if (fDebug) {
          Log() << "the decomposition " <<Endl;
          decomposed.Print();
       }

       *fSigmaInverse = uTrans.Transpose(solutionSVD.GetU());
       *fSigmaInverse /= diag;
       *fSigmaInverse *= vTrans.Transpose(solutionSVD.GetV());

       if (fDebug) {
          Log() << "the SigmaInverse " <<Endl;
          fSigmaInverse->Print();

          Log() << "the real " <<Endl;
          fSigma->Invert();
          fSigma->Print();

          Bool_t problem = false;
          for (UInt_t i =0; i< fNumParams; ++i) {
             for (UInt_t j =0; j< fNumParams; ++j) {
                if (TMath::Abs((Float_t)(*fSigma)(i,j) - (Float_t)(*fSigmaInverse)(i,j)) > 0.01) {
                   Log() << "problem, i= "<< i << " j= " << j << Endl;
                   Log() << "Sigma(i,j)= "<< (*fSigma)(i,j) << " SigmaInverse(i,j)= " << (*fSigmaInverse)(i,j) <<Endl;
                   Log() << "The difference is : " << TMath::Abs((Float_t)(*fSigma)(i,j) - (Float_t)(*fSigmaInverse)(i,j)) <<Endl;
                   problem = true;
                }
             }
          }
          if (problem) Log() << kWARNING << "Problem with the inversion!" << Endl;

       }
    }
 }

 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Probability value using Gaussian approximation
 ///
 /// Evaluates prefactor * exp( -0.5 * d^T * SigmaInverse * d ) with
 /// d = x - fMu[k], using the matrices prepared by Initialize().
 ///
 /// \param[in] x  point at which the Gaussian is evaluated; its first
 ///               fNumParams entries are read
 /// \param[in] k  class index used to select the mean vector fMu[k]
 /// \return the value of the Gaussian for class k at x
 ///

 Float_t TMVA::LDA::FSub(const std::vector<Float_t>& x, Int_t k)
 {
    // NOTE(review): 1/(2 pi sqrt(det)) is the normalisation of a Gaussian in
    // two dimensions. The factor does not depend on k, so it cancels in
    // GetProb() and in the density ratio taken by GetLogLikelihood().
    Float_t prefactor  = 1.0/(TMath::TwoPi()*TMath::Sqrt(fSigma->Determinant()));

    // fMu is a map: look the mean vector up once instead of once per matrix element
    const std::vector<Float_t>& mu = fMu[k];

    // distance of x from the class mean
    std::vector<Float_t> delta(fNumParams);
    for (UInt_t i=0; i < fNumParams; ++i) {
       delta[i] = x[i] - mu[i];
    }

    // exponent = delta^T * SigmaInverse * delta, accumulated one matrix row at a time
    Float_t exponent = 0.0;
    for (UInt_t j=0; j < fNumParams; ++j) {
       Float_t rowSum = 0;
       for (UInt_t i=0; i < fNumParams; ++i) {
          rowSum += delta[i] * (*fSigmaInverse)(j,i);
       }
       exponent += rowSum*delta[j];
    }

    exponent *= -0.5;

    return prefactor*TMath::Exp( exponent );
 }

 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Signal probability with Gaussian approximation
 ///
 /// Returns the Gaussian value of class k weighted with its event fraction,
 /// divided by the sum of the weighted Gaussian values of class 0 and class 1.
 ///
 /// \param[in] x  point at which the probability is evaluated
 /// \param[in] k  class index whose probability is requested
 ///

 Float_t TMVA::LDA::GetProb(const std::vector<Float_t>& x, Int_t k)
 {
    // weighted Gaussian of the requested class
    const Float_t weightedRequested = FSub(x,k)*fEventFraction[k];

    // normalisation: both classes, each weighted with its event fraction
    const Float_t weightedSum = FSub(x,0)*fEventFraction[0]+FSub(x,1)*fEventFraction[1];

    return weightedRequested/weightedSum;
 }

 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Log likelihood function with Gaussian approximation
 ///
 /// Returns log( FSub(k)/FSub(other) ) + log( fraction(k)/fraction(other) ),
 /// where "other" is !k, i.e. 1 for k == 0 and 0 for any non-zero k.
 ///
 /// \param[in] x  point at which the function is evaluated
 /// \param[in] k  class index in the numerator of both ratios
 ///

 Float_t TMVA::LDA::GetLogLikelihood( const std::vector<Float_t>& x, Int_t k )
 {
    const Int_t other = !k;

    // ratio of the Gaussian values and ratio of the event fractions
    const Float_t densityRatio  = FSub(x,k)/FSub(x,other);
    const Float_t fractionRatio = fEventFraction[k]/fEventFraction[other];

    return TMath::Log( densityRatio ) + TMath::Log( fractionRatio );
 }
TMVA::LDA::LDA
LDA(Float_t tolerence=1.0e-5, Bool_t debug=false)
constructor
Definition: LDA.cxx:47

TMVA::LDA::FSub
Float_t FSub(const std::vector< Float_t > &x, Int_t k)
Probability value using Gaussian approximation.
Definition: LDA.cxx:211

TDecompSVD::GetSig
const TVectorD & GetSig()
Definition: TDecompSVD.h:59

TMVA::LDA::fSigmaInverse
TMatrixF * fSigmaInverse
Definition: LDA.h:74

TMVA::Endl
MsgLogger & Endl(MsgLogger &ml)
Definition: MsgLogger.h:158

TMatrixT::Transpose
TMatrixT< Element > & Transpose(const TMatrixT< Element > &source)
Transpose matrix source.
Definition: TMatrixT.cxx:1469

TMVA::LDA::~LDA
~LDA()
destructor
Definition: LDA.cxx:60

TMath::Log
Double_t Log(Double_t x)
Definition: TMath.h:759

Float_t
float Float_t
Definition: RtypesCore.h:53

TMath::TwoPi
constexpr Double_t TwoPi()

Definition: TMath.h:45

TMatrixF
TMatrixT< Float_t > TMatrixF
Definition: TMatrixFfwd.h:22

TMVA::LDA::fLogger
MsgLogger * fLogger
Definition: LDA.h:78

TMVA::LDA::fMu
std::map< Int_t, std::vector< Float_t > > fMu
Definition: LDA.h:72

Int_t
int Int_t
Definition: RtypesCore.h:41

Bool_t
bool Bool_t
Definition: RtypesCore.h:59

TMVA::LDA::fTolerence
Float_t fTolerence
Definition: LDA.h:70

TObject::Print
virtual void Print(Option_t *option="") const
This method must be overridden when a class wants to print itself.
Definition: TObject.cxx:550

TMatrixT::Determinant
virtual Double_t Determinant() const
Return the matrix determinant.
Definition: TMatrixT.cxx:1361

TMath::Abs
Short_t Abs(Short_t d)
Definition: TMathBase.h:108

TMatrixT
TMatrixT.
Definition: TMatrixDfwd.h:22

TDecompSVD
Single Value Decomposition class.
Definition: TDecompSVD.h:23

x
Double_t x[n]
Definition: legend1.C:17

TMVA::LDA::GetProb
Float_t GetProb(const std::vector< Float_t > &x, Int_t k)
Signal probability with Gaussian approximation.
Definition: LDA.cxx:239

TMVA::LDA::fEventFraction
std::map< Int_t, Float_t > fEventFraction
Definition: LDA.h:75

TDecompSVD::GetU
const TMatrixD & GetU()
Definition: TDecompSVD.h:55

TMatrixT::Invert
TMatrixT< Element > & Invert(Double_t *det=0)
Invert the matrix and calculate its determinant.
Definition: TMatrixT.cxx:1396

TDecompSVD::Decompose
virtual Bool_t Decompose()
SVD decomposition of matrix If the decomposition succeeds, bit kDecomposed is set ...
Definition: TDecompSVD.cxx:123

Types.h

ROOT::Internal::SHA256::K
static const uint32_t K[64]
Definition: RSha256.hxx:148

TMVA::LDA::GetLogLikelihood
Float_t GetLogLikelihood(const std::vector< Float_t > &x, Int_t k)
Log likelihood function with Gaussian approximation.
Definition: LDA.cxx:252

UInt_t
unsigned int UInt_t
Definition: RtypesCore.h:42

MsgLogger.h

TMVA::LDA::fNumParams
UInt_t fNumParams
Definition: LDA.h:71

TMVA::LDA::Initialize
void Initialize(const LDAEvents &inputSignal, const LDAEvents &inputBackground)
Create LDA matrix using local events found by knn method.
Definition: LDA.cxx:68

TMath::Exp
Double_t Exp(Double_t x)
Definition: TMath.h:726

LDA.h

TMVA::LDA::Log
MsgLogger & Log() const
Definition: LDA.h:65

TMVA::MsgLogger
ostringstream derivative to redirect and format output
Definition: MsgLogger.h:59

TMatrixTBase::Print
void Print(Option_t *name="") const
Print the matrix as a table of elements.
Definition: TMatrixTBase.cxx:832

TMVA::LDA::fDebug
Bool_t fDebug
Definition: LDA.h:76

LDAEvents
std::vector< std::vector< Float_t > > LDAEvents
Definition: LDA.h:38

TMatrixF.h

TMVA::LDA::fSigma
TMatrixF * fSigma
Definition: LDA.h:73

TDecompSVD::GetV
const TMatrixD & GetV()
Definition: TDecompSVD.h:57

TMath::Sqrt
Double_t Sqrt(Double_t x)
Definition: TMath.h:690

TMath.h

TDecompSVD.h